In [1]:
# Enable IPython's autoreload extension in mode 2, so imported modules are
# reloaded before each cell runs and edits to them take effect without
# restarting the kernel.
%load_ext autoreload
%autoreload 2

In [2]:
import abc
import itertools
import os
import re
import sys
from copy import copy
from pathlib import Path
from pprint import pprint

import numpy as np
import pandas as pd
import plotly.express as px
import plotly.graph_objects as go
from plotly.subplots import make_subplots

# extend the module search path with the parent directory before importing gpusims
sys.path.append("../")
import gpusims
import gpusims.plot.metrics as metric
from gpusims.plot.data import PlotData
from gpusims.config import Config, parse_configs
from gpusims.bench import parse_benchmarks

In [3]:
# Allow wide/long dataframes to be displayed without pandas eliding rows or columns
# (up to 500 each).
pd.options.display.max_rows = 500
pd.options.display.max_columns = 500

In [4]:
# Root of the gpgpusims checkout. Set the GPGPUSIMS_ROOT environment variable to
# point at a different location; the default is the original hard-coded path.
root_dir = Path(os.environ.get("GPGPUSIMS_ROOT", "/Users/roman/dev/gpgpusims"))
benchmark_dir = root_dir / "benchmarks"
run_dir = root_dir / "run"

# Fail early, naming the offending path, if the expected layout is missing.
assert benchmark_dir.is_dir(), f"benchmark directory not found: {benchmark_dir}"
assert run_dir.is_dir(), f"run directory not found: {run_dir}"

In [5]:
# Parse the hardware configurations and the benchmark definitions from the
# YAML files inside the benchmark directory.
configs = parse_configs(benchmark_dir.joinpath("configs", "configs.yml"))
benchmarks = parse_benchmarks(benchmark_dir.joinpath("benchmarks.yml"))

# Show everything that is available: configs, benchmarks and simulators.
for loaded in (configs, benchmarks, gpusims.SIMULATORS):
    pprint(loaded)

{'sm6_gtx1080': Config(key='sm6_gtx1080', name='GTX 1080', path=PosixPath('/Users/roman/dev/gpgpusims/benchmarks/configs/SM6_GTX1080'), spec={'sm_count': 28, 'clock_speed': 1481}),
 'sm86_rtx3070': Config(key='sm86_rtx3070', name='RTX 3070', path=PosixPath('/Users/roman/dev/gpgpusims/benchmarks/configs/SM86_RTX3070'), spec={'sm_count': 46, 'clock_speed': 1132})}
{'babelstream': Benchmark(/Users/roman/dev/gpgpusims/benchmarks/BabelStream),
 'cuda10-matrixmul': Benchmark(/Users/roman/dev/gpgpusims/benchmarks/CUDA10-matrixMul),
 'cuda10-transpose': Benchmark(/Users/roman/dev/gpgpusims/benchmarks/CUDA10-transpose),
 'cuda4-matrixmul': Benchmark(/Users/roman/dev/gpgpusims/benchmarks/CUDA4-matrixMul),
 'cuda6-transpose': Benchmark(/Users/roman/dev/gpgpusims/benchmarks/CUDA6-transpose),
 'vectoradd': Benchmark(/Users/roman/dev/gpgpusims/benchmarks/vectorAdd)}
{'accelsim-ptx': <class 'gpusims.accelsim.AccelSimPTXBenchmarkConfig'>,
 'accelsim-sass': <class 'gpusims.accelsim_sass.AccelSimSASSBen

In [14]:
def _select(available, keys=None):
    """Return a shallow copy of ``available``, optionally restricted to ``keys``.

    Args:
        available: mapping of key -> object to choose from.
        keys: collection of keys to keep, or ``None`` to keep everything.

    Returns:
        ``copy(available)`` when ``keys`` is ``None``; otherwise a new dict with
        the entries of ``available`` whose key is in ``keys``, in the original
        iteration order.
    """
    if keys is None:
        return copy(available)
    return {k: v for k, v in available.items() if k in keys}


# Optional filters for quick test runs: set any of these to a list of keys to
# restrict what gets processed. ``None`` (the default) selects everything.
testing_simulators = None  # e.g. [gpusims.NATIVE] or [gpusims.MULTI2SIM]
testing_configs = None  # e.g. ["sm6_gtx1080"]
testing_benchmarks = None  # e.g. ["babelstream"] or ["cuda6-transpose"]

selected_simulators = _select(gpusims.SIMULATORS, testing_simulators)
selected_configs = _select(configs, testing_configs)
selected_benchmarks = _select(benchmarks, testing_benchmarks)

pprint(selected_simulators)
pprint(selected_configs)
pprint(selected_benchmarks)

{'accelsim-ptx': <class 'gpusims.accelsim.AccelSimPTXBenchmarkConfig'>,
 'accelsim-sass': <class 'gpusims.accelsim_sass.AccelSimSASSBenchmarkConfig'>,
 'm2s': <class 'gpusims.multi2sim.Multi2SimBenchmarkConfig'>,
 'macsim': <class 'gpusims.macsim.MacSimBenchmarkConfig'>,
 'native': <class 'gpusims.native.NativeBenchmarkConfig'>,
 'tejas': <class 'gpusims.tejas.TejasBenchmarkConfig'>}
{'sm6_gtx1080': Config(key='sm6_gtx1080', name='GTX 1080', path=PosixPath('/Users/roman/dev/gpgpusims/benchmarks/configs/SM6_GTX1080'), spec={'sm_count': 28, 'clock_speed': 1481}),
 'sm86_rtx3070': Config(key='sm86_rtx3070', name='RTX 3070', path=PosixPath('/Users/roman/dev/gpgpusims/benchmarks/configs/SM86_RTX3070'), spec={'sm_count': 46, 'clock_speed': 1132})}
{'babelstream': Benchmark(/Users/roman/dev/gpgpusims/benchmarks/BabelStream),
 'cuda10-matrixmul': Benchmark(/Users/roman/dev/gpgpusims/benchmarks/CUDA10-matrixMul),
 'cuda10-transpose': Benchmark(/Users/roman/dev/gpgpusims/benchmarks/CUDA10-transp

In [15]:
# Colour palette for the plots. colors[0] is intentionally left unused
# (not a nice colour for bars).
colors = ["#5c0048", "#584588", "#3e78b7", "#39a8d1", "#70d5dd", "#b9ffe9"]

# Bar colour for each simulator display name. "Hardware" uses a dedicated
# colour that is not part of the palette.
sim_color = {
    "GPUTejas": colors[1],
    "AccelSim PTX": colors[2],
    "AccelSim SASS": colors[3],
    "Hardware": "#fe5901",
    "Multi2Sim": colors[4],
    "MacSim": colors[5],
}

In [18]:
def plot_bars(data, debug=False, fontsize=14, font_family="Helvetica"):
    """Plot one grouped bar chart per metric and save each as a PDF in ``./figs``.

    Every chart contains one bar per row of the metric's computed table (the
    rows are looked up in ``sim_color``, i.e. they are simulator display names)
    for the single benchmark input described by ``data``.

    Args:
        data: plot data for one benchmark/config/input combination. It is passed
            to the metric constructors, and ``data.benchmark.name``,
            ``data.config.name``, ``data.config.key``, ``data.inp.args`` and
            ``data.inp.sanitized_name()`` are used for labels and file names.
        debug: if true, print each metric table before it is plotted.
        fontsize: base font size; the bar value labels use ``fontsize - 2``.
        font_family: font family for the figure text and hover labels.

    Raises:
        KeyError: if a row of a metric table has no entry in ``sim_color``.
    """
    metrics = {
        "Cycles": gpusims.plot.metrics.Cycles(data),
        "Execution Time": gpusims.plot.metrics.ExecutionTime(data),
        "Total L2 Read Hits": gpusims.plot.metrics.L2ReadHit(data),
        "Total DRAM Reads": gpusims.plot.metrics.DRAMReads(data),
        "Total DRAM Writes": gpusims.plot.metrics.DRAMWrites(data),
        "Total IPC": gpusims.plot.metrics.IPC(data),
        "Total Instruction Count": gpusims.plot.metrics.InstructionCount(data),
    }

    # all bars of a chart share a single x category: the benchmark and its input
    x_label = f"{data.benchmark.name} {data.inp.args}"
    margin = 50

    # make sure the output directory exists before any figure is written
    out_dir = Path("./figs")
    out_dir.mkdir(parents=True, exist_ok=True)

    for metric_name, metric_obj in metrics.items():
        metric_df = metric_obj.compute()
        if debug:
            print("######", metric_name)
            print(metric_df)

        bars = []
        for sim in metric_df.index:
            # label the hardware bar with the name of the GPU config
            name = sim
            if sim == "Hardware":
                name += f" ({data.config.name})"
            values = metric_df.loc[sim]
            bars.append(go.Bar(
                x=[x_label],
                y=values,
                text=values,
                textposition='auto',
                textfont=dict(
                    size=fontsize - 2,
                    color="black",
                ),
                hovertemplate=(
                    "<b>%{x}</b><br>" +
                    "%{y:.2f}<br>"
                ),
                name=name,
                marker=dict(
                    color=sim_color[sim],
                    # width=0 keeps the bar outline invisible
                    line=dict(
                        color='rgba(50, 171, 96, 1.0)',
                        width=0
                    ),
                ),
            ))

        # append the unit to the axis title when the metric declares one
        yaxis_text = metric_name
        unit = metric_obj.config.get("unit")
        if unit is not None:
            yaxis_text += f" [{unit}]"

        layout = go.Layout(
            font_family=font_family,
            font_color="black",
            font_size=fontsize,
            title=dict(
                text=f"{metric_name} for {data.benchmark.name} ({data.config.name})",
                x=0.5,
                y=0.95,
                xanchor="center",
                yanchor="top",
            ),
            yaxis=go.layout.YAxis(
                title=yaxis_text,
                gridcolor="gray",
                zerolinecolor="gray",
            ),
            hoverlabel=dict(
                bgcolor="white",
                font_size=fontsize,
                font_family=font_family,
            ),
            barmode="group",
            bargroupgap=0.1,
            bargap=0.25,
            showlegend=True,
            plot_bgcolor="white",
            margin=dict(
                pad=10,
                autoexpand=True,
                l=margin, r=margin, t=1.5*margin, b=margin
            ),
            width=700,
            height=400,
        )
        # metrics can opt into a logarithmic y axis through their config
        if metric_obj.config.get("log"):
            layout.yaxis.type = "log"

        fig = go.Figure(data=bars, layout=layout)

        # file name: bar_<metric>_<benchmark>_<config key>_<input>, slugified
        name_parts = ["bar", metric_name, data.benchmark.name, data.config.key, data.inp.sanitized_name()]
        filename = out_dir / gpusims.utils.slugify("_".join(name_parts))
        filename = filename.with_suffix(".pdf")
        fig.write_image(filename, format='pdf')

In [19]:
# For every (config, benchmark, input) combination, collect the result
# dataframes of all enabled simulators into one PlotData and plot its bars.

debug = None
for (config_name, config), (bench_name, bench) in itertools.product(
    selected_configs.items(), selected_benchmarks.items()
):
    print(config_name, bench_name)
    for inp in bench.inputs:
        plot_data = PlotData(benchmark=bench, config=config, inp=inp)
        for sim_name, sim in selected_simulators.items():
            # only simulators the benchmark is enabled for contribute data
            if bench.enabled(sim_name):
                print(sim_name, config_name, bench_name)
                bench_config = sim(
                    run_dir=run_dir / sim_name.lower(), benchmark=bench, config=config
                )
                plot_data[sim_name] = bench_config.load_dataframe(inp)

        plot_bars(plot_data)

sm6_gtx1080 vectoradd
native sm6_gtx1080 vectoradd
accelsim-ptx sm6_gtx1080 vectoradd
accelsim-sass sm6_gtx1080 vectoradd
tejas sm6_gtx1080 vectoradd
macsim sm6_gtx1080 vectoradd
native sm6_gtx1080 vectoradd
accelsim-ptx sm6_gtx1080 vectoradd
accelsim-sass sm6_gtx1080 vectoradd
tejas sm6_gtx1080 vectoradd
macsim sm6_gtx1080 vectoradd
sm6_gtx1080 cuda10-transpose
native sm6_gtx1080 cuda10-transpose
accelsim-ptx sm6_gtx1080 cuda10-transpose
accelsim-sass sm6_gtx1080 cuda10-transpose
sm6_gtx1080 cuda6-transpose
native sm6_gtx1080 cuda6-transpose
accelsim-ptx sm6_gtx1080 cuda6-transpose
accelsim-sass sm6_gtx1080 cuda6-transpose
tejas sm6_gtx1080 cuda6-transpose
m2s sm6_gtx1080 cuda6-transpose
macsim sm6_gtx1080 cuda6-transpose
sm6_gtx1080 cuda10-matrixmul
native sm6_gtx1080 cuda10-matrixmul
accelsim-ptx sm6_gtx1080 cuda10-matrixmul
accelsim-sass sm6_gtx1080 cuda10-matrixmul
sm6_gtx1080 cuda4-matrixmul
native sm6_gtx1080 cuda4-matrixmul
accelsim-ptx sm6_gtx1080 cuda4-matrixmul
accelsim-sass

In [43]:
# Debugging aid: load and display the results dataframe of a single simulator
# for one benchmark/config pair (first benchmark input only).
# Other choices to try:
#   sim:       gpusims.MULTI2SIM, gpusims.MACSIM, gpusims.TEJAS
#   benchmark: benchmarks["cuda4-matrixmul"]
#   config:    configs["sm86_rtx3070"]
sim = gpusims.NATIVE
benchmark = benchmarks["cuda6-transpose"]
config = configs["sm6_gtx1080"]

bench_config = gpusims.SIMULATORS[sim](
    run_dir=run_dir / sim.lower(), benchmark=benchmark, config=config
)
# the chosen benchmark must be enabled for the chosen simulator
assert bench_config.benchmark.enabled(sim)

bench_input = bench_config.benchmark.inputs[0]
df = bench_config.load_dataframe(bench_input)
df

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,Unnamed: 3_level_0,Unnamed: 4_level_0,Block X,Block Y,Block Z,Duration,Dynamic SMem,Grid X,Grid Y,Grid Z,Registers Per Thread,Start,Static SMem,achieved_occupancy,achieved_occupancy_max,achieved_occupancy_min,achieved_occupancy_std,atomic_transactions,atomic_transactions_max,atomic_transactions_min,atomic_transactions_per_request,atomic_transactions_per_request_max,atomic_transactions_per_request_min,atomic_transactions_per_request_std,atomic_transactions_std,branch_efficiency,branch_efficiency_max,branch_efficiency_min,branch_efficiency_std,cf_executed,cf_executed_max,cf_executed_min,cf_executed_std,cf_issued,cf_issued_max,cf_issued_min,cf_issued_std,dram_read_bytes,dram_read_bytes_max,dram_read_bytes_min,dram_read_bytes_std,dram_read_throughput,dram_read_throughput_max,dram_read_throughput_min,dram_read_throughput_std,dram_read_transactions,dram_read_transactions_max,dram_read_transactions_min,dram_read_transactions_std,dram_write_bytes,dram_write_bytes_max,dram_write_bytes_min,dram_write_bytes_std,dram_write_throughput,dram_write_throughput_max,dram_write_throughput_min,dram_write_throughput_std,dram_write_transactions,dram_write_transactions_max,dram_write_transactions_min,dram_write_transactions_std,ecc_throughput,ecc_throughput_max,ecc_throughput_min,ecc_throughput_std,ecc_transactions,ecc_transactions_max,ecc_transactions_min,ecc_transactions_std,elapsed_cycles_sm,elapsed_cycles_sm_max,elapsed_cycles_sm_min,elapsed_cycles_sm_std,eligible_warps_per_cycle,eligible_warps_per_cycle_max,eligible_warps_per_cycle_min,eligible_warps_per_cycle_std,flop_count_dp,flop_count_dp_add,flop_count_dp_add_max,flop_count_dp_add_min,flop_count_dp_add_std,flop_count_dp_fma,flop_count_dp_fma_max,flop_count_dp_fma_min,flop_count_dp_fma_std,flop_count_dp_max,flop_count_dp_min,flop_count_dp_mul,flop_count_dp_mul_max,flop_count_dp_mul_min,flop_count_dp_mul_std,flop_count_dp_std,flop_count_hp,flop_count_hp_add,flop_count_hp_add_m
ax,flop_count_hp_add_min,flop_count_hp_add_std,flop_count_hp_fma,flop_count_hp_fma_max,flop_count_hp_fma_min,flop_count_hp_fma_std,flop_count_hp_max,flop_count_hp_min,flop_count_hp_mul,flop_count_hp_mul_max,flop_count_hp_mul_min,flop_count_hp_mul_std,flop_count_hp_std,flop_count_sp,flop_count_sp_add,flop_count_sp_add_max,flop_count_sp_add_min,flop_count_sp_add_std,flop_count_sp_fma,flop_count_sp_fma_max,flop_count_sp_fma_min,flop_count_sp_fma_std,flop_count_sp_max,flop_count_sp_min,flop_count_sp_mul,flop_count_sp_mul_max,flop_count_sp_mul_min,flop_count_sp_mul_std,flop_count_sp_special,flop_count_sp_special_max,flop_count_sp_special_min,flop_count_sp_special_std,flop_count_sp_std,flop_dp_efficiency,flop_dp_efficiency_max,flop_dp_efficiency_min,flop_dp_efficiency_std,flop_hp_efficiency,flop_hp_efficiency_max,flop_hp_efficiency_min,flop_hp_efficiency_std,flop_sp_efficiency,flop_sp_efficiency_max,flop_sp_efficiency_min,flop_sp_efficiency_std,gld_efficiency,gld_efficiency_max,gld_efficiency_min,gld_efficiency_std,gld_requested_throughput,gld_requested_throughput_max,gld_requested_throughput_min,gld_requested_throughput_std,gld_throughput,gld_throughput_max,gld_throughput_min,gld_throughput_std,gld_transactions,gld_transactions_max,gld_transactions_min,gld_transactions_per_request,gld_transactions_per_request_max,gld_transactions_per_request_min,gld_transactions_per_request_std,gld_transactions_std,global_atomic_requests,global_atomic_requests_max,global_atomic_requests_min,global_atomic_requests_std,global_hit_rate,global_hit_rate_max,global_hit_rate_min,global_hit_rate_std,global_load_requests,global_load_requests_max,global_load_requests_min,global_load_requests_std,global_reduction_requests,global_reduction_requests_max,global_reduction_requests_min,global_reduction_requests_std,global_store_requests,global_store_requests_max,global_store_requests_min,global_store_requests_std,gst_efficiency,gst_efficiency_max,gst_efficiency_min,gst_efficiency_std,gst_requested_throu
ghput,gst_requested_throughput_max,gst_requested_throughput_min,gst_requested_throughput_std,gst_throughput,gst_throughput_max,gst_throughput_min,gst_throughput_std,gst_transactions,gst_transactions_max,gst_transactions_min,gst_transactions_per_request,gst_transactions_per_request_max,gst_transactions_per_request_min,gst_transactions_per_request_std,gst_transactions_std,inst_bit_convert,inst_bit_convert_max,inst_bit_convert_min,inst_bit_convert_std,inst_compute_ld_st,inst_compute_ld_st_max,inst_compute_ld_st_min,inst_compute_ld_st_std,inst_control,inst_control_max,inst_control_min,inst_control_std,inst_executed,inst_executed_global_atomics,inst_executed_global_atomics_max,inst_executed_global_atomics_min,inst_executed_global_atomics_std,inst_executed_global_loads,inst_executed_global_loads_max,inst_executed_global_loads_min,inst_executed_global_loads_std,inst_executed_global_reductions,inst_executed_global_reductions_max,inst_executed_global_reductions_min,inst_executed_global_reductions_std,inst_executed_global_stores,inst_executed_global_stores_max,inst_executed_global_stores_min,inst_executed_global_stores_std,inst_executed_local_loads,inst_executed_local_loads_max,inst_executed_local_loads_min,inst_executed_local_loads_std,inst_executed_local_stores,inst_executed_local_stores_max,inst_executed_local_stores_min,inst_executed_local_stores_std,inst_executed_max,inst_executed_min,inst_executed_shared_atomics,inst_executed_shared_atomics_max,inst_executed_shared_atomics_min,inst_executed_shared_atomics_std,inst_executed_shared_loads,inst_executed_shared_loads_max,inst_executed_shared_loads_min,inst_executed_shared_loads_std,inst_executed_shared_stores,inst_executed_shared_stores_max,inst_executed_shared_stores_min,inst_executed_shared_stores_std,...,l2_read_transactions_min,l2_read_transactions_std,l2_surface_atomic_store_bytes,l2_surface_atomic_store_bytes_max,l2_surface_atomic_store_bytes_min,l2_surface_atomic_store_bytes_std,l2_surface_load_bytes,l2_surface_load_b
ytes_max,l2_surface_load_bytes_min,l2_surface_load_bytes_std,l2_surface_reduction_bytes,l2_surface_reduction_bytes_max,l2_surface_reduction_bytes_min,l2_surface_reduction_bytes_std,l2_surface_store_bytes,l2_surface_store_bytes_max,l2_surface_store_bytes_min,l2_surface_store_bytes_std,l2_tex_hit_rate,l2_tex_hit_rate_max,l2_tex_hit_rate_min,l2_tex_hit_rate_std,l2_tex_read_hit_rate,l2_tex_read_hit_rate_max,l2_tex_read_hit_rate_min,l2_tex_read_hit_rate_std,l2_tex_read_throughput,l2_tex_read_throughput_max,l2_tex_read_throughput_min,l2_tex_read_throughput_std,l2_tex_read_transactions,l2_tex_read_transactions_max,l2_tex_read_transactions_min,l2_tex_read_transactions_std,l2_tex_write_hit_rate,l2_tex_write_hit_rate_max,l2_tex_write_hit_rate_min,l2_tex_write_hit_rate_std,l2_tex_write_throughput,l2_tex_write_throughput_max,l2_tex_write_throughput_min,l2_tex_write_throughput_std,l2_tex_write_transactions,l2_tex_write_transactions_max,l2_tex_write_transactions_min,l2_tex_write_transactions_std,l2_write_throughput,l2_write_throughput_max,l2_write_throughput_min,l2_write_throughput_std,l2_write_transactions,l2_write_transactions_max,l2_write_transactions_min,l2_write_transactions_std,ldst_executed,ldst_executed_max,ldst_executed_min,ldst_executed_std,ldst_issued,ldst_issued_max,ldst_issued_min,ldst_issued_std,local_hit_rate,local_hit_rate_max,local_hit_rate_min,local_hit_rate_std,local_load_requests,local_load_requests_max,local_load_requests_min,local_load_requests_std,local_load_throughput,local_load_throughput_max,local_load_throughput_min,local_load_throughput_std,local_load_transactions,local_load_transactions_max,local_load_transactions_min,local_load_transactions_per_request,local_load_transactions_per_request_max,local_load_transactions_per_request_min,local_load_transactions_per_request_std,local_load_transactions_std,local_memory_overhead,local_memory_overhead_max,local_memory_overhead_min,local_memory_overhead_std,local_store_requests,local_store_requests_max,local_sto
re_requests_min,local_store_requests_std,local_store_throughput,local_store_throughput_max,local_store_throughput_min,local_store_throughput_std,local_store_transactions,local_store_transactions_max,local_store_transactions_min,local_store_transactions_per_request,local_store_transactions_per_request_max,local_store_transactions_per_request_min,local_store_transactions_per_request_std,local_store_transactions_std,pcie_total_data_received,pcie_total_data_received_max,pcie_total_data_received_min,pcie_total_data_received_std,pcie_total_data_transmitted,pcie_total_data_transmitted_max,pcie_total_data_transmitted_min,pcie_total_data_transmitted_std,shared_efficiency,shared_efficiency_max,shared_efficiency_min,shared_efficiency_std,shared_load_throughput,shared_load_throughput_max,shared_load_throughput_min,shared_load_throughput_std,shared_load_transactions,shared_load_transactions_max,shared_load_transactions_min,shared_load_transactions_per_request,shared_load_transactions_per_request_max,shared_load_transactions_per_request_min,shared_load_transactions_per_request_std,shared_load_transactions_std,shared_store_throughput,shared_store_throughput_max,shared_store_throughput_min,shared_store_throughput_std,shared_store_transactions,shared_store_transactions_max,shared_store_transactions_min,shared_store_transactions_per_request,shared_store_transactions_per_request_max,shared_store_transactions_per_request_min,shared_store_transactions_per_request_std,shared_store_transactions_std,sm_efficiency,sm_efficiency_max,sm_efficiency_min,sm_efficiency_std,stall_constant_memory_dependency,stall_constant_memory_dependency_max,stall_constant_memory_dependency_min,stall_constant_memory_dependency_std,stall_exec_dependency,stall_exec_dependency_max,stall_exec_dependency_min,stall_exec_dependency_std,stall_inst_fetch,stall_inst_fetch_max,stall_inst_fetch_min,stall_inst_fetch_std,stall_memory_dependency,stall_memory_dependency_max,stall_memory_dependency_min,stall_memory_dependency_std
,stall_memory_throttle,stall_memory_throttle_max,stall_memory_throttle_min,stall_memory_throttle_std,stall_not_selected,stall_not_selected_max,stall_not_selected_min,stall_not_selected_std,stall_other,stall_other_max,stall_other_min,stall_other_std,stall_pipe_busy,stall_pipe_busy_max,stall_pipe_busy_min,stall_pipe_busy_std,stall_sync,stall_sync_max,stall_sync_min,stall_sync_std,stall_texture,stall_texture_max,stall_texture_min,stall_texture_std,surface_atomic_requests,surface_atomic_requests_max,surface_atomic_requests_min,surface_atomic_requests_std,surface_load_requests,surface_load_requests_max,surface_load_requests_min,surface_load_requests_std,surface_reduction_requests,surface_reduction_requests_max,surface_reduction_requests_min,surface_reduction_requests_std,surface_store_requests,surface_store_requests_max,surface_store_requests_min,surface_store_requests_std,sysmem_read_bytes,sysmem_read_bytes_max,sysmem_read_bytes_min,sysmem_read_bytes_std,sysmem_read_throughput,sysmem_read_throughput_max,sysmem_read_throughput_min,sysmem_read_throughput_std,sysmem_read_transactions,sysmem_read_transactions_max,sysmem_read_transactions_min,sysmem_read_transactions_std,sysmem_write_bytes,sysmem_write_bytes_max,sysmem_write_bytes_min,sysmem_write_bytes_std,sysmem_write_throughput,sysmem_write_throughput_max,sysmem_write_throughput_min,sysmem_write_throughput_std,sysmem_write_transactions,sysmem_write_transactions_max,sysmem_write_transactions_min,sysmem_write_transactions_std,tex_cache_hit_rate,tex_cache_hit_rate_max,tex_cache_hit_rate_min,tex_cache_hit_rate_std,tex_cache_throughput,tex_cache_throughput_max,tex_cache_throughput_min,tex_cache_throughput_std,tex_cache_transactions,tex_cache_transactions_max,tex_cache_transactions_min,tex_cache_transactions_std,texture_load_requests,texture_load_requests_max,texture_load_requests_min,texture_load_requests_std,unique_warps_launched,unique_warps_launched_max,unique_warps_launched_min,unique_warps_launched_std,warp_execution_effi
ciency,warp_execution_efficiency_max,warp_execution_efficiency_min,warp_execution_efficiency_std,warp_nonpred_execution_efficiency,warp_nonpred_execution_efficiency_max,warp_nonpred_execution_efficiency_min,warp_nonpred_execution_efficiency_std
Stream,Context,Device,Kernel,Correlation_ID,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1,Unnamed: 90_level_1,Unnamed: 91_level_1,Unnamed: 92_level_1,Unnamed: 93_level_1,Unnamed: 94_level_1,Unnamed: 95_level_1,Unnamed: 96_level_1,Unnamed: 97_level_1,Unnamed: 98_level_1,Unnamed: 99_level_1,Unnamed: 100_level_1,Unnamed: 101_level_1,Unnamed: 
102_level_1,Unnamed: 103_level_1,Unnamed: 104_level_1,Unnamed: 105_level_1,Unnamed: 106_level_1,Unnamed: 107_level_1,Unnamed: 108_level_1,Unnamed: 109_level_1,Unnamed: 110_level_1,Unnamed: 111_level_1,Unnamed: 112_level_1,Unnamed: 113_level_1,Unnamed: 114_level_1,Unnamed: 115_level_1,Unnamed: 116_level_1,Unnamed: 117_level_1,Unnamed: 118_level_1,Unnamed: 119_level_1,Unnamed: 120_level_1,Unnamed: 121_level_1,Unnamed: 122_level_1,Unnamed: 123_level_1,Unnamed: 124_level_1,Unnamed: 125_level_1,Unnamed: 126_level_1,Unnamed: 127_level_1,Unnamed: 128_level_1,Unnamed: 129_level_1,Unnamed: 130_level_1,Unnamed: 131_level_1,Unnamed: 132_level_1,Unnamed: 133_level_1,Unnamed: 134_level_1,Unnamed: 135_level_1,Unnamed: 136_level_1,Unnamed: 137_level_1,Unnamed: 138_level_1,Unnamed: 139_level_1,Unnamed: 140_level_1,Unnamed: 141_level_1,Unnamed: 142_level_1,Unnamed: 143_level_1,Unnamed: 144_level_1,Unnamed: 145_level_1,Unnamed: 146_level_1,Unnamed: 147_level_1,Unnamed: 148_level_1,Unnamed: 149_level_1,Unnamed: 150_level_1,Unnamed: 151_level_1,Unnamed: 152_level_1,Unnamed: 153_level_1,Unnamed: 154_level_1,Unnamed: 155_level_1,Unnamed: 156_level_1,Unnamed: 157_level_1,Unnamed: 158_level_1,Unnamed: 159_level_1,Unnamed: 160_level_1,Unnamed: 161_level_1,Unnamed: 162_level_1,Unnamed: 163_level_1,Unnamed: 164_level_1,Unnamed: 165_level_1,Unnamed: 166_level_1,Unnamed: 167_level_1,Unnamed: 168_level_1,Unnamed: 169_level_1,Unnamed: 170_level_1,Unnamed: 171_level_1,Unnamed: 172_level_1,Unnamed: 173_level_1,Unnamed: 174_level_1,Unnamed: 175_level_1,Unnamed: 176_level_1,Unnamed: 177_level_1,Unnamed: 178_level_1,Unnamed: 179_level_1,Unnamed: 180_level_1,Unnamed: 181_level_1,Unnamed: 182_level_1,Unnamed: 183_level_1,Unnamed: 184_level_1,Unnamed: 185_level_1,Unnamed: 186_level_1,Unnamed: 187_level_1,Unnamed: 188_level_1,Unnamed: 189_level_1,Unnamed: 190_level_1,Unnamed: 191_level_1,Unnamed: 192_level_1,Unnamed: 193_level_1,Unnamed: 194_level_1,Unnamed: 195_level_1,Unnamed: 196_level_1,Unnamed: 
197_level_1,Unnamed: 198_level_1,Unnamed: 199_level_1,Unnamed: 200_level_1,Unnamed: 201_level_1,Unnamed: 202_level_1,Unnamed: 203_level_1,Unnamed: 204_level_1,Unnamed: 205_level_1,Unnamed: 206_level_1,Unnamed: 207_level_1,Unnamed: 208_level_1,Unnamed: 209_level_1,Unnamed: 210_level_1,Unnamed: 211_level_1,Unnamed: 212_level_1,Unnamed: 213_level_1,Unnamed: 214_level_1,Unnamed: 215_level_1,Unnamed: 216_level_1,Unnamed: 217_level_1,Unnamed: 218_level_1,Unnamed: 219_level_1,Unnamed: 220_level_1,Unnamed: 221_level_1,Unnamed: 222_level_1,Unnamed: 223_level_1,Unnamed: 224_level_1,Unnamed: 225_level_1,Unnamed: 226_level_1,Unnamed: 227_level_1,Unnamed: 228_level_1,Unnamed: 229_level_1,Unnamed: 230_level_1,Unnamed: 231_level_1,Unnamed: 232_level_1,Unnamed: 233_level_1,Unnamed: 234_level_1,Unnamed: 235_level_1,Unnamed: 236_level_1,Unnamed: 237_level_1,Unnamed: 238_level_1,Unnamed: 239_level_1,Unnamed: 240_level_1,Unnamed: 241_level_1,Unnamed: 242_level_1,Unnamed: 243_level_1,Unnamed: 244_level_1,Unnamed: 245_level_1,Unnamed: 246_level_1,Unnamed: 247_level_1,Unnamed: 248_level_1,Unnamed: 249_level_1,Unnamed: 250_level_1,Unnamed: 251_level_1,Unnamed: 252_level_1,Unnamed: 253_level_1,Unnamed: 254_level_1,Unnamed: 255_level_1,Unnamed: 256_level_1,Unnamed: 257_level_1,Unnamed: 258_level_1,Unnamed: 259_level_1,Unnamed: 260_level_1,Unnamed: 261_level_1,Unnamed: 262_level_1,Unnamed: 263_level_1,Unnamed: 264_level_1,Unnamed: 265_level_1,Unnamed: 266_level_1,Unnamed: 267_level_1,Unnamed: 268_level_1,Unnamed: 269_level_1,Unnamed: 270_level_1,Unnamed: 271_level_1,Unnamed: 272_level_1,Unnamed: 273_level_1,Unnamed: 274_level_1,Unnamed: 275_level_1,Unnamed: 276_level_1,Unnamed: 277_level_1,Unnamed: 278_level_1,Unnamed: 279_level_1,Unnamed: 280_level_1,Unnamed: 281_level_1,Unnamed: 282_level_1,Unnamed: 283_level_1,Unnamed: 284_level_1,Unnamed: 285_level_1,Unnamed: 286_level_1,Unnamed: 287_level_1,Unnamed: 288_level_1,Unnamed: 289_level_1,Unnamed: 290_level_1,Unnamed: 291_level_1,Unnamed: 
292_level_1,Unnamed: 293_level_1,Unnamed: 294_level_1,Unnamed: 295_level_1,Unnamed: 296_level_1,Unnamed: 297_level_1,Unnamed: 298_level_1,Unnamed: 299_level_1,Unnamed: 300_level_1,Unnamed: 301_level_1,Unnamed: 302_level_1,Unnamed: 303_level_1,Unnamed: 304_level_1,Unnamed: 305_level_1,Unnamed: 306_level_1,Unnamed: 307_level_1,Unnamed: 308_level_1,Unnamed: 309_level_1,Unnamed: 310_level_1,Unnamed: 311_level_1,Unnamed: 312_level_1,Unnamed: 313_level_1,Unnamed: 314_level_1,Unnamed: 315_level_1,Unnamed: 316_level_1,Unnamed: 317_level_1,Unnamed: 318_level_1,Unnamed: 319_level_1,Unnamed: 320_level_1,Unnamed: 321_level_1,Unnamed: 322_level_1,Unnamed: 323_level_1,Unnamed: 324_level_1,Unnamed: 325_level_1,Unnamed: 326_level_1,Unnamed: 327_level_1,Unnamed: 328_level_1,Unnamed: 329_level_1,Unnamed: 330_level_1,Unnamed: 331_level_1,Unnamed: 332_level_1,Unnamed: 333_level_1,Unnamed: 334_level_1,Unnamed: 335_level_1,Unnamed: 336_level_1,Unnamed: 337_level_1,Unnamed: 338_level_1,Unnamed: 339_level_1,Unnamed: 340_level_1,Unnamed: 341_level_1,Unnamed: 342_level_1,Unnamed: 343_level_1,Unnamed: 344_level_1,Unnamed: 345_level_1,Unnamed: 346_level_1,Unnamed: 347_level_1,Unnamed: 348_level_1,Unnamed: 349_level_1,Unnamed: 350_level_1,Unnamed: 351_level_1,Unnamed: 352_level_1,Unnamed: 353_level_1,Unnamed: 354_level_1,Unnamed: 355_level_1,Unnamed: 356_level_1,Unnamed: 357_level_1,Unnamed: 358_level_1,Unnamed: 359_level_1,Unnamed: 360_level_1,Unnamed: 361_level_1,Unnamed: 362_level_1,Unnamed: 363_level_1,Unnamed: 364_level_1,Unnamed: 365_level_1,Unnamed: 366_level_1,Unnamed: 367_level_1,Unnamed: 368_level_1,Unnamed: 369_level_1,Unnamed: 370_level_1,Unnamed: 371_level_1,Unnamed: 372_level_1,Unnamed: 373_level_1,Unnamed: 374_level_1,Unnamed: 375_level_1,Unnamed: 376_level_1,Unnamed: 377_level_1,Unnamed: 378_level_1,Unnamed: 379_level_1,Unnamed: 380_level_1,Unnamed: 381_level_1,Unnamed: 382_level_1,Unnamed: 383_level_1,Unnamed: 384_level_1,Unnamed: 385_level_1,Unnamed: 386_level_1,Unnamed: 
387_level_1,Unnamed: 388_level_1,Unnamed: 389_level_1,Unnamed: 390_level_1,Unnamed: 391_level_1,Unnamed: 392_level_1,Unnamed: 393_level_1,Unnamed: 394_level_1,Unnamed: 395_level_1,Unnamed: 396_level_1,Unnamed: 397_level_1,Unnamed: 398_level_1,Unnamed: 399_level_1,Unnamed: 400_level_1,Unnamed: 401_level_1,Unnamed: 402_level_1,Unnamed: 403_level_1,Unnamed: 404_level_1,Unnamed: 405_level_1,Unnamed: 406_level_1,Unnamed: 407_level_1,Unnamed: 408_level_1,Unnamed: 409_level_1,Unnamed: 410_level_1,Unnamed: 411_level_1,Unnamed: 412_level_1,Unnamed: 413_level_1,Unnamed: 414_level_1,Unnamed: 415_level_1,Unnamed: 416_level_1,Unnamed: 417_level_1,Unnamed: 418_level_1,Unnamed: 419_level_1,Unnamed: 420_level_1,Unnamed: 421_level_1,Unnamed: 422_level_1,Unnamed: 423_level_1,Unnamed: 424_level_1,Unnamed: 425_level_1,Unnamed: 426_level_1,Unnamed: 427_level_1,Unnamed: 428_level_1,Unnamed: 429_level_1,Unnamed: 430_level_1,Unnamed: 431_level_1,Unnamed: 432_level_1,Unnamed: 433_level_1,Unnamed: 434_level_1,Unnamed: 435_level_1,Unnamed: 436_level_1,Unnamed: 437_level_1,Unnamed: 438_level_1,Unnamed: 439_level_1,Unnamed: 440_level_1,Unnamed: 441_level_1,Unnamed: 442_level_1,Unnamed: 443_level_1,Unnamed: 444_level_1,Unnamed: 445_level_1,Unnamed: 446_level_1,Unnamed: 447_level_1,Unnamed: 448_level_1,Unnamed: 449_level_1,Unnamed: 450_level_1,Unnamed: 451_level_1,Unnamed: 452_level_1,Unnamed: 453_level_1,Unnamed: 454_level_1,Unnamed: 455_level_1,Unnamed: 456_level_1,Unnamed: 457_level_1,Unnamed: 458_level_1,Unnamed: 459_level_1,Unnamed: 460_level_1,Unnamed: 461_level_1,Unnamed: 462_level_1,Unnamed: 463_level_1,Unnamed: 464_level_1,Unnamed: 465_level_1,Unnamed: 466_level_1,Unnamed: 467_level_1,Unnamed: 468_level_1,Unnamed: 469_level_1,Unnamed: 470_level_1,Unnamed: 471_level_1,Unnamed: 472_level_1,Unnamed: 473_level_1,Unnamed: 474_level_1,Unnamed: 475_level_1,Unnamed: 476_level_1,Unnamed: 477_level_1,Unnamed: 478_level_1,Unnamed: 479_level_1,Unnamed: 480_level_1,Unnamed: 481_level_1,Unnamed: 
482_level_1,Unnamed: 483_level_1,Unnamed: 484_level_1,Unnamed: 485_level_1,Unnamed: 486_level_1,Unnamed: 487_level_1,Unnamed: 488_level_1,Unnamed: 489_level_1,Unnamed: 490_level_1,Unnamed: 491_level_1,Unnamed: 492_level_1,Unnamed: 493_level_1,Unnamed: 494_level_1,Unnamed: 495_level_1,Unnamed: 496_level_1,Unnamed: 497_level_1,Unnamed: 498_level_1,Unnamed: 499_level_1,Unnamed: 500_level_1,Unnamed: 501_level_1,Unnamed: 502_level_1,Unnamed: 503_level_1,Unnamed: 504_level_1,Unnamed: 505_level_1
7.0,1.0,NVIDIA GeForce GTX 1080,_Z13copySharedMemPfS_ii,134.0,16.0,16.0,1.0,2.176,0.0,2.0,2.0,1.0,9.0,301886.348333,1.0,0.123801,0.124365,0.123292,0.00044,0.0,0,0,0.0,0,0,0.0,0.0,100.0,100.0,100.0,0.0,64.0,64,64,0.0,64.0,64,64,0.0,3989.333333,7552,704,2802.553756,1.958343,3.699815,0.34801,1.371507,124.666667,236,22,87.579805,1941.333333,5440,0,2478.892943,0.951648,2.665121,0.0,1.214084,60.666667,170,0,77.465404,0.0,0.0,0.0,0.0,0.0,0,0,0.0,135558.333333,205250,96485,49400.189327,0.217575,0.317605,0.167179,0.070733,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,100.0,100.0,0.0,2.015897,2.024786,2.006679,0.007396,2.015897,2.024786,2.006679,0.007396,514.0,514,514,16.0625,16.0625,16.0625,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,128.0,128,128,0.0,0.0,0,0,0.0,128.0,128,128,0.0,100.0,100.0,100.0,0.0,2.015897,2.024786,2.006679,0.007396,2.015897,2.024786,2.006679,0.007396,128.0,128,128,4.0,4,4,0.0,0.0,0.0,0,0,0.0,5120.0,5120,5120,0.0,1024.0,1024,1024,0.0,1152.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,0.0,0,0,0.0,1152,1152,0.0,0,0,0.0,32.0,32,32,0.0,32.0,32,32,0.0,...,322,253.636661,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,91.666667,100.0,75.0,11.785113,100.0,100.0,100.0,0.0,2.015897,2.024786,2.006679,0.007396,128.0,128,128,0.0,83.333333,100.0,50.0,23.570226,2.015897,2.024786,2.006679,0.007396,128.0,128,128,0.0,2.388258,2.473026,2.230429,0.111704,151.666667,157,141,7.542472,352.0,352,352,0.0,512.0,512,512,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,170.666667,512,0,241.359115,170.666667,512,0,241.359115,100.0,100.0,100.0,0.0,2.015897,2.024786,2.006679,0.007396,32.0,32,32,1.0,1,1,0.0,0.0,2.015897,2.024786,2.006679,0.007396,32.0,32,32,1.0,1,1,0.0,0.0,4.468686,4.784738,4.089161,0.287493,32.019628,3
7.337857,26.740139,4.326587,12.792172,14.829853,11.08416,1.546839,29.001854,33.226991,25.21867,3.284285,12.934474,14.67034,11.356119,1.357601,0.067448,0.07734,0.058802,0.007619,0.075879,0.087007,0.066152,0.008572,7.196754,15.148842,2.970809,5.626676,0.370963,0.425367,0.323411,0.041904,5.540828,6.472351,4.762955,0.706265,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,160.0,160,160,0.0,80.63587,80.991449,80.26717,0.295831,5.0,5,5,0.0,50.0,50.0,50.0,0.0,2.015897,2.024786,2.006679,0.007396,128.0,128,128,0.0,0.0,0,0,0.0,32.0,32,32,0.0,100.0,100.0,100.0,0.0,97.222222,97.222222,97.222222,0.0
7.0,1.0,NVIDIA GeForce GTX 1080,_Z13copySharedMemPfS_ii,136.0,16.0,16.0,1.0,1.877333,0.0,2.0,2.0,1.0,9.0,301892.652333,1.0,0.124008,0.124404,0.123256,0.000532,0.0,0,0,0.0,0,0,0.0,0.0,100.0,100.0,100.0,0.0,64.0,64,64,0.0,64.0,64,64,0.0,15061.333333,22208,6080,6710.817006,7.284019,10.628372,3.002355,3.183075,470.666667,694,190,209.713031,2880.0,4288,128,1946.13326,1.400098,2.085847,0.062283,0.946078,90.0,134,4,60.816664,0.0,0.0,0.0,0.0,0.0,0,0,0.0,122840.0,137325,111560,10759.88925,0.200722,0.268366,0.166667,0.047832,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,100.0,100.0,0.0,1.991988,2.022639,1.960276,0.025471,1.991988,2.022639,1.960276,0.025471,514.0,514,514,16.0625,16.0625,16.0625,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,128.0,128,128,0.0,0.0,0,0,0.0,128.0,128,128,0.0,100.0,100.0,100.0,0.0,1.991988,2.022639,1.960276,0.025471,1.991988,2.022639,1.960276,0.025471,128.0,128,128,4.0,4,4,0.0,0.0,0.0,0,0,0.0,5120.0,5120,5120,0.0,1024.0,1024,1024,0.0,1152.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,0.0,0,0,0.0,1152,1152,0.0,0,0,0.0,32.0,32,32,0.0,32.0,32,32,0.0,...,220,128.170026,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,66.666667,100.0,25.0,31.180478,66.666667,100.0,0.0,47.140452,1.991988,2.022639,1.960276,0.025471,128.0,128,128,0.0,66.666667,100.0,50.0,23.570226,1.991988,2.022639,1.960276,0.025471,128.0,128,128,0.0,2.275978,2.404401,2.195469,0.091779,146.333333,157,141,7.542472,352.0,352,352,0.0,512.0,512,512,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,8192.0,24064,0,11225.145107,1024.0,3072,0,1448.154688,100.0,100.0,100.0,0.0,1.991988,2.022639,1.960276,0.025471,32.0,32,32,1.0,1,1,0.0,0.0,1.991988,2.022639,1.960276,0.025471,32.0,32,32,1.0,1,1,0.0,0.0,4.728858,6.548968,3.793103,1.287183,32.
383067,38.70824,26.731141,4.91275,15.255546,17.451808,13.47924,1.648756,23.103167,33.046422,15.868417,7.269707,15.277088,17.343447,13.463639,1.593989,0.07998,0.091251,0.071319,0.008344,0.09072,0.102658,0.082462,0.008646,6.743911,12.02612,3.471954,3.770435,0.439889,0.501882,0.392253,0.045893,6.626632,7.670811,5.908311,0.75553,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,160.0,160,160,0.0,79.679532,80.905561,78.411043,1.018825,5.0,5,5,0.0,50.0,50.0,50.0,0.0,1.991988,2.022639,1.960276,0.025471,128.0,128,128,0.0,0.0,0,0,0.0,32.0,32,32,0.0,100.0,100.0,100.0,0.0,97.222222,97.222222,97.222222,0.0
7.0,1.0,NVIDIA GeForce GTX 1080,_Z13copySharedMemPfS_ii,138.0,16.0,16.0,1.0,1.877333,0.0,2.0,2.0,1.0,9.0,301896.428333,1.0,0.123423,0.123723,0.123255,0.000212,0.0,0,0,0.0,0,0,0.0,0.0,100.0,100.0,100.0,0.0,64.0,64,64,0.0,64.0,64,64,0.0,3392.0,8960,256,3947.646725,1.677951,4.436284,0.126014,1.95553,106.0,280,8,123.36396,170.666667,384,0,159.644049,0.083999,0.188622,0.0,0.078373,5.333333,12,0,4.988877,0.0,0.0,0.0,0.0,0.0,0,0,0.0,102375.0,107825,97520,4227.984153,0.318452,0.318922,0.318009,0.000373,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,100.0,100.0,0.0,2.018737,2.028016,2.011971,0.006787,2.018737,2.028016,2.011971,0.006787,514.0,514,514,16.0625,16.0625,16.0625,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,128.0,128,128,0.0,0.0,0,0,0.0,128.0,128,128,0.0,100.0,100.0,100.0,0.0,2.018737,2.028016,2.011971,0.006787,2.018737,2.028016,2.011971,0.006787,128.0,128,128,4.0,4,4,0.0,0.0,0.0,0,0,0.0,5120.0,5120,5120,0.0,1024.0,1024,1024,0.0,1152.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,0.0,0,0,0.0,1152,1152,0.0,0,0,0.0,32.0,32,32,0.0,32.0,32,32,0.0,...,192,131.141993,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,66.666667,100.0,25.0,31.180478,66.666667,100.0,0.0,47.140452,2.018737,2.028016,2.011971,0.006787,128.0,128,128,0.0,66.666667,100.0,50.0,23.570226,2.018737,2.028016,2.011971,0.006787,128.0,128,128,0.0,2.391607,2.473026,2.233986,0.111475,151.666667,157,141,7.542472,352.0,352,352,0.0,512.0,512,512,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,170.666667,512,0,241.359115,341.333333,512,0,241.359115,100.0,100.0,100.0,0.0,2.018737,2.028016,2.011971,0.006787,32.0,32,32,1.0,1,1,0.0,0.0,2.018737,2.028016,2.011971,0.006787,32.0,32,32,1.0,1,1,0.0,0.0,5.115159,5.958663,4.074668,0.781649,36.063944,38.398084,31
.850278,2.985286,17.368298,21.12855,13.340429,3.185113,13.811718,20.3456,5.247793,6.328599,17.494626,20.764502,13.916977,2.803949,0.090905,0.109901,0.07096,0.015912,0.105327,0.127074,0.07983,0.019469,7.071496,12.160724,4.121936,3.613785,0.499977,0.604458,0.390279,0.087516,7.49371,9.142425,5.800958,1.364504,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,160.0,160,160,0.0,80.749486,81.120622,80.478845,0.27147,5.0,5,5,0.0,50.0,50.0,50.0,0.0,2.018737,2.028016,2.011971,0.006787,128.0,128,128,0.0,0.0,0,0,0.0,32.0,32,32,0.0,100.0,100.0,100.0,0.0,97.222222,97.222222,97.222222,0.0
7.0,1.0,NVIDIA GeForce GTX 1080,_Z13copySharedMemPfS_ii,140.0,16.0,16.0,1.0,1.866667,0.0,2.0,2.0,1.0,9.0,301900.172333,1.0,0.123998,0.124403,0.123256,0.000525,0.0,0,0,0.0,0,0,0.0,0.0,100.0,100.0,100.0,0.0,64.0,64,64,0.0,64.0,64,64,0.0,3733.333333,5632,256,2462.313997,1.838188,2.772309,0.126081,1.212319,116.666667,176,8,76.947312,1749.333333,4480,0,1956.163138,0.861485,2.206412,0.0,0.963449,54.666667,140,0,61.130098,0.0,0.0,0.0,0.0,0.0,0,0,0.0,103438.333333,112430,96855,6582.563246,0.231139,0.268209,0.157702,0.051929,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,100.0,100.0,0.0,2.016936,2.017291,2.016225,0.000503,2.016936,2.017291,2.016225,0.000503,514.0,514,514,16.0625,16.0625,16.0625,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,128.0,128,128,0.0,0.0,0,0,0.0,128.0,128,128,0.0,100.0,100.0,100.0,0.0,2.016936,2.017291,2.016225,0.000503,2.016936,2.017291,2.016225,0.000503,128.0,128,128,4.0,4,4,0.0,0.0,0.0,0,0,0.0,5120.0,5120,5120,0.0,1024.0,1024,1024,0.0,1152.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,0.0,0,0,0.0,1152,1152,0.0,0,0,0.0,32.0,32,32,0.0,32.0,32,32,0.0,...,464,134.831582,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,75.0,100.0,50.0,20.412415,66.666667,100.0,0.0,47.140452,2.016936,2.017291,2.016225,0.000503,128.0,128,128,0.0,83.333333,100.0,50.0,23.570226,2.016936,2.017291,2.016225,0.000503,128.0,128,128,0.0,2.389844,2.474333,2.222172,0.118563,151.666667,157,141,7.542472,352.0,352,352,0.0,512.0,512,512,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,170.666667,512,0,241.359115,170.666667,512,0,241.359115,100.0,100.0,100.0,0.0,2.016936,2.017291,2.016225,0.000503,32.0,32,32,1.0,1,1,0.0,0.0,2.016936,2.017291,2.016225,0.000503,32.0,32,32,1.0,1,1,0.0,0.0,5.968881,7.100864,4.092893,1.335947,33.17
543,43.161032,20.750925,9.310009,13.459927,15.764053,11.509927,1.754699,11.966071,29.138225,2.854943,12.150112,21.924372,37.272027,12.898891,10.908402,0.070191,0.082211,0.060104,0.009128,0.079592,0.092488,0.069495,0.009593,11.9106,18.579666,3.06314,6.519187,0.393567,0.452163,0.353111,0.042423,7.020249,8.549802,5.65913,1.186107,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,160.0,160,160,0.0,80.677423,80.691639,80.648991,0.020104,5.0,5,5,0.0,50.0,50.0,50.0,0.0,2.016936,2.017291,2.016225,0.000503,128.0,128,128,0.0,0.0,0,0,0.0,32.0,32,32,0.0,100.0,100.0,100.0,0.0,97.222222,97.222222,97.222222,0.0
7.0,1.0,NVIDIA GeForce GTX 1080,_Z14transposeNaivePfS_ii,148.0,16.0,16.0,1.0,2.048,0.0,2.0,2.0,1.0,8.0,301938.178,0.0,0.122846,0.12347,0.122229,0.000507,0.0,0,0,0.0,0,0,0.0,0.0,100.0,100.0,100.0,0.0,32.0,32,32,0.0,32.0,32,32,0.0,13973.333333,23936,1024,9589.23248,6.735411,11.514534,0.494901,4.615901,436.666667,748,32,299.663515,1493.333333,4352,0,2022.057918,0.718472,2.093552,0.0,0.972657,46.666667,136,0,63.18931,0.0,0.0,0.0,0.0,0.0,0,0,0.0,114583.333333,142590,99830,19813.169582,0.245535,0.26202,0.212733,0.023194,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,100.0,100.0,0.0,1.976536,1.979604,1.970401,0.004338,1.976536,1.979604,1.970401,0.004338,514.0,514,514,16.0625,16.0625,16.0625,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,128.0,128,128,0.0,0.0,0,0,0.0,128.0,128,128,0.0,12.5,12.5,12.5,0.0,1.976536,1.979604,1.970401,0.004338,15.812293,15.836833,15.763212,0.034705,1024.0,1024,1024,32.0,32,32,0.0,0.0,0.0,0,0,0.0,2048.0,2048,2048,0.0,1024.0,1024,1024,0.0,704.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,0.0,0,0,0.0,704,704,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,...,288,43.369216,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,90.740741,97.222222,86.111111,4.721314,33.333333,100.0,0.0,47.140452,1.976536,1.979604,1.970401,0.004338,128.0,128,128,0.0,97.916667,100.0,96.875,1.473139,15.812293,15.836833,15.763212,0.034705,1024.0,1024,1024,0.0,16.177619,16.285338,16.037887,0.103526,1047.666667,1053,1037,7.542472,192.0,192,192,0.0,384.0,384,384,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0,0,0.0,341.333333,512,0,241.359115,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,3.969484,4.902407,3.13977,0.723285,41.85034,49.124996,37.573864,5.170363,8.940034,9.74820
6,7.658054,0.916717,10.639636,23.941483,3.630485,9.410373,32.646586,41.900428,21.254748,8.563072,2.377538,2.658602,1.920186,0.326213,0.038996,0.0422,0.034036,0.003557,3.243275,3.885078,2.609411,0.520819,0.263595,0.285268,0.238251,0.019369,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,160.0,160,160,0.0,79.061464,79.184167,78.816059,0.173528,5.0,5,5,0.0,10.0,10.0,10.0,0.0,1.976536,1.979604,1.970401,0.004338,128.0,128,128,0.0,0.0,0,0,0.0,32.0,32,32,0.0,100.0,100.0,100.0,0.0,100.0,100.0,100.0,0.0
7.0,1.0,NVIDIA GeForce GTX 1080,_Z14transposeNaivePfS_ii,150.0,16.0,16.0,1.0,1.92,0.0,2.0,2.0,1.0,8.0,301943.49,0.0,0.123033,0.12362,0.122261,0.00057,0.0,0,0,0.0,0,0,0.0,0.0,100.0,100.0,100.0,0.0,32.0,32,32,0.0,32.0,32,32,0.0,3072.0,7360,256,3081.319198,1.486269,3.562648,0.123277,1.491981,96.0,230,8,96.291225,1578.666667,4352,0,1967.298881,0.764034,2.106609,0.0,0.95236,49.333333,136,0,61.47809,0.0,0.0,0.0,0.0,0.0,0,0,0.0,148528.333333,200695,100400,41044.714303,0.262048,0.262274,0.261682,0.000261,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,100.0,100.0,0.0,1.977902,1.982691,1.972439,0.004212,1.977902,1.982691,1.972439,0.004212,514.0,514,514,16.0625,16.0625,16.0625,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,128.0,128,128,0.0,0.0,0,0,0.0,128.0,128,128,0.0,12.5,12.5,12.5,0.0,1.977902,1.982691,1.972439,0.004212,15.82322,15.861527,15.779513,0.033699,1024.0,1024,1024,32.0,32,32,0.0,0.0,0.0,0,0,0.0,2048.0,2048,2048,0.0,1024.0,1024,1024,0.0,704.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,0.0,0,0,0.0,704,704,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,...,264,266.554977,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,92.592593,100.0,88.888889,5.237828,33.333333,100.0,0.0,47.140452,1.977902,1.982691,1.972439,0.004212,128.0,128,128,0.0,100.0,100.0,100.0,0.0,15.82322,15.861527,15.779513,0.033699,1024.0,1024,1024,0.0,16.106541,16.276891,15.979839,0.125137,1042.333333,1053,1037,7.542472,192.0,192,192,0.0,384.0,384,384,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0,0,0.0,341.333333,512,0,241.359115,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,3.77995,5.209148,2.966398,1.01382,51.894066,59.534948,47.743713,5.40963,11.10836,12.039901,9.314805,1.268553,5.151732,5.54
0794,4.402862,0.529666,24.282622,26.248708,20.96863,2.356897,2.850332,3.220806,2.311502,0.389843,0.048407,0.052272,0.041277,0.005047,4.357909,4.98323,3.164557,0.844151,0.306574,0.331054,0.26142,0.031966,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,160.0,160,160,0.0,79.116099,79.307635,78.897565,0.168495,5.0,5,5,0.0,10.0,10.0,10.0,0.0,1.977902,1.982691,1.972439,0.004212,128.0,128,128,0.0,0.0,0,0,0.0,32.0,32,32,0.0,100.0,100.0,100.0,0.0,100.0,100.0,100.0,0.0
7.0,1.0,NVIDIA GeForce GTX 1080,_Z14transposeNaivePfS_ii,152.0,16.0,16.0,1.0,1.984,0.0,2.0,2.0,1.0,8.0,301947.180667,0.0,0.123185,0.123454,0.122767,0.000299,0.0,0,0,0.0,0,0,0.0,0.0,100.0,100.0,100.0,0.0,32.0,32,32,0.0,32.0,32,32,0.0,8832.0,18496,1920,7041.357445,4.233102,8.893001,0.921721,3.391086,276.0,578,60,220.04242,2816.0,4160,128,1900.703028,1.345089,2.000156,0.061448,0.907736,88.0,130,4,59.39697,0.0,0.0,0.0,0.0,0.0,0,0,0.0,105940.0,121650,97510,11118.564056,0.211841,0.26202,0.112997,0.069896,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,100.0,100.0,0.0,1.959674,1.969384,1.9433,0.011645,1.959674,1.969384,1.9433,0.011645,514.0,514,514,16.0625,16.0625,16.0625,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,128.0,128,128,0.0,0.0,0,0,0.0,128.0,128,128,0.0,12.5,12.5,12.5,0.0,1.959674,1.969384,1.9433,0.011645,15.677394,15.755074,15.546397,0.093161,1024.0,1024,1024,32.0,32,32,0.0,0.0,0.0,0,0,0.0,2048.0,2048,2048,0.0,1024.0,1024,1024,0.0,704.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,0.0,0,0,0.0,704,704,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,...,288,312.590609,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,90.740741,97.222222,86.111111,4.721314,33.333333,100.0,0.0,47.140452,1.959674,1.969384,1.9433,0.011645,128.0,128,128,0.0,97.916667,100.0,96.875,1.473139,15.677394,15.755074,15.546397,0.093161,1024.0,1024,1024,0.0,15.957394,15.986676,15.930417,0.023025,1042.333333,1053,1037,7.542472,192.0,192,192,0.0,384.0,384,384,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,4.362958,4.838415,3.852723,0.403158,32.664245,33.869291,32.029623,0.852499,8.179697,8.473436,8.018977,0.208012,26.34159,37.59760
8,3.912698,15.859658,23.675385,36.510363,17.158698,9.076062,2.203041,2.268142,2.163851,0.046351,0.03541,0.036682,0.034714,0.000901,6.668218,14.672617,2.661421,5.659966,0.232415,0.256771,0.219857,0.017225,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,160.0,160,160,0.0,78.386969,78.775369,77.731987,0.465805,5.0,5,5,0.0,10.0,10.0,10.0,0.0,1.959674,1.969384,1.9433,0.011645,128.0,128,128,0.0,0.0,0,0,0.0,32.0,32,32,0.0,100.0,100.0,100.0,0.0,100.0,100.0,100.0,0.0
7.0,1.0,NVIDIA GeForce GTX 1080,_Z14transposeNaivePfS_ii,154.0,16.0,16.0,1.0,1.931,0.0,2.0,2.0,1.0,8.0,301951.202,0.0,0.122962,0.123102,0.122761,0.000146,0.0,0,0,0.0,0,0,0.0,0.0,100.0,100.0,100.0,0.0,32.0,32,32,0.0,32.0,32,32,0.0,14293.333333,32384,5056,12792.993638,6.887186,15.67565,2.429704,6.214597,446.666667,1012,158,399.781051,1514.666667,4032,128,1783.088955,0.713697,1.894598,0.061959,0.836521,47.333333,126,4,55.72153,0.0,0.0,0.0,0.0,0.0,0,0,0.0,109071.666667,119975,95805,10007.871347,0.170889,0.211845,0.123142,0.03653,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,100.0,100.0,0.0,1.958577,1.982691,1.924671,0.024678,1.958577,1.982691,1.924671,0.024678,514.0,514,514,16.0625,16.0625,16.0625,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,128.0,128,128,0.0,0.0,0,0,0.0,128.0,128,128,0.0,12.5,12.5,12.5,0.0,1.958577,1.982691,1.924671,0.024678,15.668612,15.861527,15.397365,0.197423,1024.0,1024,1024,32.0,32,32,0.0,0.0,0.0,0,0,0.0,2048.0,2048,2048,0.0,1024.0,1024,1024,0.0,704.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,0.0,0,0,0.0,704,704,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,...,288,66.459679,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,98.148148,100.0,97.222222,1.309457,100.0,100.0,100.0,0.0,1.958577,1.982691,1.924671,0.024678,128.0,128,128,0.0,97.916667,100.0,96.875,1.473139,15.668612,15.861527,15.397365,0.197423,1024.0,1024,1024,0.0,15.86753,16.062894,15.59284,0.199929,1037.0,1037,1037,0.0,192.0,192,192,0.0,384.0,384,384,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0,0,0.0,170.666667,512,0,241.359115,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,4.181011,5.859437,3.139082,1.198312,56.213196,59.288673,50.263733,4.20771,8.759934,9.223832,7.868279,0
.630668,9.505361,19.816407,4.34545,7.291011,19.527162,20.784367,17.176162,1.663746,2.197374,2.331154,1.937928,0.183486,0.039014,0.041078,0.03497,0.00286,3.50176,3.916065,2.681043,0.580344,0.2562,0.286964,0.221477,0.026881,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,160.0,160,160,0.0,78.343061,79.307635,76.986826,0.987113,5.0,5,5,0.0,10.0,10.0,10.0,0.0,1.958577,1.982691,1.924671,0.024678,128.0,128,128,0.0,0.0,0,0,0.0,32.0,32,32,0.0,100.0,100.0,100.0,0.0,100.0,100.0,100.0,0.0
7.0,1.0,NVIDIA GeForce GTX 1080,_Z17transposeDiagonalPfS_ii,218.0,16.0,16.0,1.0,2.186667,0.0,2.0,2.0,1.0,11.0,302188.099,1.0625,0.124061,0.124452,0.12371,0.000304,0.0,0,0,0.0,0,0,0.0,0.0,100.0,100.0,100.0,0.0,64.0,64,64,0.0,64.0,64,64,0.0,3136.0,3456,2560,408.130698,1.502471,1.659098,1.220781,0.199602,98.0,108,80,12.754084,170.666667,384,0,159.644049,0.081899,0.184249,0.0,0.076597,5.333333,12,0,4.988877,0.0,0.0,0.0,0.0,0.0,0,0,0.0,113356.666667,146565,95855,23493.269367,0.31203,0.348883,0.238694,0.051856,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,1024.0,1024,1024,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,100.0,100.0,0.0,1.961638,1.966339,1.95325,0.005946,1.961638,1.966339,1.95325,0.005946,514.0,514,514,16.0625,16.0625,16.0625,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,128.0,128,128,0.0,0.0,0,0,0.0,128.0,128,128,0.0,100.0,100.0,100.0,0.0,1.961638,1.966339,1.95325,0.005946,1.961638,1.966339,1.95325,0.005946,128.0,128,128,4.0,4,4,0.0,0.0,2048.0,2048,2048,0.0,5120.0,5120,5120,0.0,2048.0,2048,2048,0.0,2208.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,0.0,0,0,0.0,2208,2208,0.0,0,0,0.0,32.0,32,32,0.0,32.0,32,32,0.0,...,192,110.082797,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,75.0,100.0,50.0,20.412415,66.666667,100.0,0.0,47.140452,1.961638,1.966339,1.95325,0.005946,128.0,128,128,0.0,83.333333,100.0,50.0,23.570226,1.961638,1.966339,1.95325,0.005946,128.0,128,128,0.0,2.247874,2.425949,2.151627,0.126056,146.666667,158,141,8.013877,352.0,352,352,0.0,512.0,512,512,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0,0,0.0,170.666667,512,0,241.359115,50.0,50.0,50.0,0.0,3.923276,3.932678,3.9065,0.011891,64.0,64,64,2.0,2,2,0.0,0.0,3.923276,3.932678,3.9065,0.011891,64.0,64,64,2.0,2,2,0.0,0.0,7.830925,8.107297,7.56305,0.222269,24.419187,30.712378,16.6901,5
.813915,12.507421,14.324394,11.435267,1.291725,39.367816,46.578793,25.004574,10.156374,15.168643,20.817021,7.689787,5.51326,0.051026,0.058542,0.046866,0.005325,0.242373,0.278073,0.222613,0.025292,3.186884,3.368483,2.86122,0.230789,0.398584,0.439062,0.351494,0.036054,4.658067,5.504738,4.162198,0.601609,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,160.0,160,160,0.0,78.465527,78.653551,78.13,0.237829,5.0,5,5,0.0,50.0,50.0,50.0,0.0,1.961638,1.966339,1.95325,0.005946,128.0,128,128,0.0,0.0,0,0,0.0,32.0,32,32,0.0,100.0,100.0,100.0,0.0,96.014493,96.014493,96.014493,0.0
7.0,1.0,NVIDIA GeForce GTX 1080,_Z17transposeDiagonalPfS_ii,220.0,16.0,16.0,1.0,1.962667,0.0,2.0,2.0,1.0,11.0,302193.368333,1.0625,0.12382,0.124047,0.123696,0.000161,0.0,0,0,0.0,0,0,0.0,0.0,100.0,100.0,100.0,0.0,64.0,64,64,0.0,64.0,64,64,0.0,21066.666667,61664,128,28711.405461,10.053411,29.420633,0.061575,13.697006,658.333333,1927,4,897.231421,128.0,256,0,104.511562,0.061239,0.122141,0.0,0.049864,4.0,8,0,3.265986,0.0,0.0,0.0,0.0,0.0,0,0,0.0,100730.0,105695,98210,3510.918683,0.420442,0.549803,0.238397,0.132477,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0,0,0.0,0,0,0.0,1024.0,1024,1024,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,100.0,100.0,100.0,0.0,1.965697,1.972439,1.954251,0.008136,1.965697,1.972439,1.954251,0.008136,514.0,514,514,16.0625,16.0625,16.0625,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,128.0,128,128,0.0,0.0,0,0,0.0,128.0,128,128,0.0,100.0,100.0,100.0,0.0,1.965697,1.972439,1.954251,0.008136,1.965697,1.972439,1.954251,0.008136,128.0,128,128,4.0,4,4,0.0,0.0,2048.0,2048,2048,0.0,5120.0,5120,5120,0.0,2048.0,2048,2048,0.0,2208.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,32.0,32,32,0.0,0.0,0,0,0.0,0.0,0,0,0.0,2208,2208,0.0,0,0,0.0,32.0,32,32,0.0,32.0,32,32,0.0,...,196,294.668552,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,63.020833,75.0,39.0625,16.9411,76.041667,100.0,28.125,33.8822,1.965697,1.972439,1.954251,0.008136,128.0,128,128,0.0,50.0,50.0,50.0,0.0,1.965697,1.972439,1.954251,0.008136,128.0,128,128,0.0,2.165338,2.172765,2.152729,0.008963,141.0,141,141,0.0,352.0,352,352,0.0,512.0,512,512,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0,0,0.0,0.0,170.666667,512,0,241.359115,341.333333,512,0,241.359115,50.0,50.0,50.0,0.0,3.931394,3.944878,3.908501,0.016273,64.0,64,64,2.0,2,2,0.0,0.0,3.931394,3.944878,3.908501,0.016273,64.0,64,64,2.0,2,2,0.0,0.0,4.727184,5.549346,4.217168,0.586942,23.311498,30.
575849,17.401199,5.463085,12.018638,13.980805,10.068343,1.597278,37.620487,47.922497,24.330325,9.860508,16.426112,20.863773,8.334615,5.730494,0.049257,0.057298,0.041264,0.006546,0.313849,0.401089,0.196003,0.086478,5.379209,9.168076,2.965828,2.712433,0.369425,0.429738,0.309478,0.049097,4.511523,5.357399,3.77305,0.651251,0.0,0.0,0.0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0,0,0.0,0.0,0.0,0.0,0.0,0.0,0,0,0.0,160.0,160,160,0.0,78.627883,78.897565,78.170026,0.325459,5.0,5,5,0.0,50.0,50.0,50.0,0.0,1.965697,1.972439,1.954251,0.008136,128.0,128,128,0.0,0.0,0,0,0.0,32.0,32,32,0.0,100.0,100.0,100.0,0.0,96.014493,96.014493,96.014493,0.0


In [37]:
# Walk every (simulator, config, benchmark) combination and keep the ones the
# benchmark reports as enabled for the simulator.
all_bench_configs = []

sim_config_bench_combos = itertools.product(
    selected_simulators.items(),
    selected_configs.items(),
    selected_benchmarks.items(),
)
for (sim_name, sim), (config_name, config), (bench_name, bench) in sim_config_bench_combos:
    if bench.enabled(sim):
        # NOTE(review): nothing is appended to `all_bench_configs` here, so the
        # count printed below only reflects whatever was added elsewhere.
        # The registration code is currently disabled (and targets
        # `all_plot_configs`, not `all_bench_configs` -- confirm which is meant):
        #
        # for inp in bench:
        # all_plot_configs.append(BenchmarkPlot(bench_config=sim(
        #     run_dir=run_dir / sim_name.lower(),
        #     benchmark=bench,
        #     config=config,
        # )))
        pass

print(f"{len(all_bench_configs)} total benchmark configs")

0 total benchmark configs


In [14]:
# Load the hardware measurements for the first input of the first benchmark
# config only: both loops stop after a single iteration.
for plot_config in all_bench_configs:
    for inp in plot_config.bench_config.benchmark.inputs:
        # Use the loop variable rather than `plot`, which is only bound by a
        # different cell and would make this cell depend on execution order.
        hw_df = plot_config.load_hardware_df(inp)
        break
    break

# Accel-Sim SASS statistics: read the long-format stats file and pivot it so
# that each (kernel, kernel_id) pair becomes one row with one column per stat.
# NOTE(review): `accel_sass_results` must be defined by an earlier cell.
accel_sass_df = pd.read_csv(accel_sass_results / "results/stats.csv")
print("accel sass shape", accel_sass_df.shape)
accel_sass_df = accel_sass_df.pivot(index=["kernel", "kernel_id"], columns=["stat"])["value"]
print("accel sass shape", accel_sass_df.shape)
# pprint(accel_df.columns.tolist())

# Only the last expression of a cell is rendered automatically, so the first
# frame is shown explicitly with IPython's built-in `display`.
display(accel_sass_df.T)
hw_df.T

kernels shape (1, 11)
cycles shape (1, 592)
inner join shape (1, 603)


Stream,7.0
Context,1.0
Device,NVIDIA GeForce GTX 1080 (0)
Kernel,_Z6vecAddPdS_S_i
Correlation_ID,112.0
Block X,1024.0
Block Y,1.0
Block Z,1.0
Duration,3.626667
Dynamic SMem,0.0
...,...
warp_execution_efficiency_std,0.0
warp_nonpred_execution_efficiency,94.327446
warp_nonpred_execution_efficiency_max,94.327446
warp_nonpred_execution_efficiency_min,94.327446


In [11]:
# Pick the first collected benchmark config and load its hardware measurements.
# Fail with an explicit message when nothing was collected, instead of a bare
# IndexError from the `[0]` lookup.
assert all_bench_configs, (
    "all_bench_configs is empty: no (simulator, config, benchmark) "
    "combination was collected"
)
plot = all_bench_configs[0]
hw_df = plot.load_hardware_df()

NameError: name 'pd' is not defined

In [None]:
# Gather the CSV files below `<native_results>/results` (searched recursively)
# and hand both file lists to `build_hw_df`.
# The patterns are glob patterns (`*` is a wildcard, `.` is a literal dot).
_cycle_csv_paths = list((native_results / "results").rglob(r"result.cycles.csv.*"))
_kernel_csv_paths = list((native_results / "results").rglob(r"result.csv.*"))

hw_df = build_hw_df(
    cycle_csv_files=_cycle_csv_paths,
    kernel_csv_files=_kernel_csv_paths,
)

# Transposed view: one row per column of the frame, easier to scan when wide.
hw_df.T