├── .gitignore ├── LICENSE ├── MeasurementSeries.hpp ├── README.md ├── cuda-incore ├── Makefile └── main.cu ├── cuda-memcpy ├── Makefile └── main.cu ├── device_order.py ├── dtime.hpp ├── gpu-cache ├── Makefile ├── a100_80.txt ├── a40.txt ├── cuda-cache-l2.svg ├── cuda-cache.svg ├── l40.txt ├── main.cu ├── mi100.txt ├── mi210.txt ├── mi300x.txt ├── plot.py ├── rx6900xt.txt └── v100.txt ├── gpu-clock.cuh ├── gpu-error.h ├── gpu-l2-cache ├── Makefile ├── a100_80.txt ├── cuda-cache.svg ├── h100_pcie.txt ├── h200.txt ├── l40.txt ├── main.cu ├── mi100.txt ├── mi210.txt ├── plot.py ├── rx6900xt.txt └── sycl │ ├── build.sh │ └── sycl-gpu-l2-cache.cpp ├── gpu-l2-stream ├── Makefile ├── a100_80.txt ├── a40.txt ├── gh200.txt ├── l40.txt ├── main.cu ├── mi100.txt ├── mi210.txt ├── mi300a.txt ├── mi300x.txt ├── plot.py └── rx6900xt.txt ├── gpu-latency ├── Makefile ├── a100_80.txt ├── a40.txt ├── gh200.txt ├── l40.txt ├── latencies.pdf ├── latencies.svg ├── latencies_AMD.pdf ├── latencies_AMD.svg ├── latencies_NV.pdf ├── latencies_NV.svg ├── main.cu ├── mi100.txt ├── mi210.txt ├── mi300a.txt ├── mi300x.txt ├── plot.py ├── rx6900xt.txt └── v100.txt ├── gpu-metrics.hpp ├── gpu-metrics ├── README.md ├── cuda_metrics │ ├── Eval.hpp │ ├── Metric.hpp │ ├── Parser.h │ ├── Parser.hpp │ ├── ScopeExit.h │ ├── Utils.h │ ├── measureMetricPW.cpp │ ├── measureMetricPW.hpp │ └── pythonInterface.cpp ├── gpu-metrics.hpp └── rocm_metrics │ ├── Makefile │ ├── rocm_metrics.hpp │ ├── test_rocm_metrics │ ├── test_rocm_metrics.hip │ └── vectoradd_hip.cpp ├── gpu-roofline ├── L40_plot.pdf ├── Makefile ├── alex_a100_40.txt ├── alex_a40.txt ├── genoa_l40.txt ├── h200.txt ├── main.cu ├── mi300x.txt ├── plot.py └── series.sh ├── gpu-small-kernels ├── Makefile ├── a100_80.txt ├── a100_80_graph.txt ├── a100_80_gsync.txt ├── a40.txt ├── a40_graph.txt ├── a40_pt.txt ├── h200.txt ├── h200_graph.txt ├── h200_gsync.txt ├── h200_pt.txt ├── l40.txt ├── l40_graph.txt ├── l40_gsync.txt ├── l40_pt.txt ├── main.cu ├── mi210.txt ├── mi210_graph.txt ├── mi210_gsync.txt ├── mi210_pt.txt ├── plot.py ├── readme.md ├── repeated-stream.svg ├── rx6900xt.txt ├── rx6900xt_graph.txt ├── rx6900xt_gsync.txt └── rx6900xt_pt.txt ├── gpu-stats.h ├── gpu-stream ├── Makefile ├── a100_40.txt ├── a100_80.txt ├── a40.txt ├── cuda-stream.pdf ├── cuda-stream.svg ├── gh200.txt ├── h100_pcie.txt ├── l40.txt ├── main.cu ├── maxbars.pdf ├── maxbars.svg ├── mi100.txt ├── mi210.txt ├── mi300a.txt ├── mi300x.txt ├── minbars.pdf ├── minbars.svg ├── past_results │ ├── a100_40.txt │ └── h100_pcie.txt ├── plot.py ├── rx6900xt.txt └── v100.txt ├── gpu-strides ├── Makefile ├── a100.txt ├── a40.txt ├── h200.txt ├── l1plot.py ├── main.cu ├── mi210.txt └── rdna2.txt ├── measure_metric ├── Eval.hpp ├── Metric.hpp ├── Parser.h ├── Parser.hpp ├── ScopeExit.h ├── Utils.h ├── measureMetricPW.cpp ├── measureMetricPW.hpp └── pythonInterface.cpp ├── metrics.cuh ├── rocm-metrics └── rocm-metrics.hpp ├── um-stream ├── Makefile └── main.cu └── unmaintained ├── cuda-3d-stream ├── Makefile └── main.cu ├── cuda-busy ├── Makefile └── main.cu ├── cuda-cache-overlap ├── Makefile └── main.cu ├── cuda-cache-patterns └── cuda-cache-patterns.ipynb ├── cuda-gapped-stream ├── Makefile └── main.cu └── cuda-l1 └── cuda-l1.ipynb /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/LICENSE -------------------------------------------------------------------------------- /MeasurementSeries.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/MeasurementSeries.hpp -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/README.md -------------------------------------------------------------------------------- /cuda-incore/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/cuda-incore/Makefile -------------------------------------------------------------------------------- /cuda-incore/main.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/cuda-incore/main.cu -------------------------------------------------------------------------------- /cuda-memcpy/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/cuda-memcpy/Makefile -------------------------------------------------------------------------------- /cuda-memcpy/main.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/cuda-memcpy/main.cu -------------------------------------------------------------------------------- /device_order.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/device_order.py -------------------------------------------------------------------------------- /dtime.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/dtime.hpp -------------------------------------------------------------------------------- /gpu-cache/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-cache/Makefile -------------------------------------------------------------------------------- /gpu-cache/a100_80.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-cache/a100_80.txt -------------------------------------------------------------------------------- /gpu-cache/a40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-cache/a40.txt -------------------------------------------------------------------------------- /gpu-cache/cuda-cache-l2.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-cache/cuda-cache-l2.svg -------------------------------------------------------------------------------- /gpu-cache/cuda-cache.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-cache/cuda-cache.svg -------------------------------------------------------------------------------- /gpu-cache/l40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-cache/l40.txt -------------------------------------------------------------------------------- /gpu-cache/main.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-cache/main.cu -------------------------------------------------------------------------------- /gpu-cache/mi100.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-cache/mi100.txt -------------------------------------------------------------------------------- /gpu-cache/mi210.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-cache/mi210.txt -------------------------------------------------------------------------------- /gpu-cache/mi300x.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-cache/mi300x.txt -------------------------------------------------------------------------------- /gpu-cache/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-cache/plot.py -------------------------------------------------------------------------------- /gpu-cache/rx6900xt.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-cache/rx6900xt.txt -------------------------------------------------------------------------------- /gpu-cache/v100.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-cache/v100.txt -------------------------------------------------------------------------------- /gpu-clock.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-clock.cuh -------------------------------------------------------------------------------- /gpu-error.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-error.h -------------------------------------------------------------------------------- /gpu-l2-cache/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-cache/Makefile -------------------------------------------------------------------------------- /gpu-l2-cache/a100_80.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-cache/a100_80.txt -------------------------------------------------------------------------------- /gpu-l2-cache/cuda-cache.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-cache/cuda-cache.svg -------------------------------------------------------------------------------- /gpu-l2-cache/h100_pcie.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-cache/h100_pcie.txt -------------------------------------------------------------------------------- /gpu-l2-cache/h200.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-cache/h200.txt -------------------------------------------------------------------------------- /gpu-l2-cache/l40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-cache/l40.txt -------------------------------------------------------------------------------- /gpu-l2-cache/main.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-cache/main.cu -------------------------------------------------------------------------------- /gpu-l2-cache/mi100.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-cache/mi100.txt -------------------------------------------------------------------------------- /gpu-l2-cache/mi210.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-cache/mi210.txt -------------------------------------------------------------------------------- /gpu-l2-cache/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-cache/plot.py -------------------------------------------------------------------------------- /gpu-l2-cache/rx6900xt.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-cache/rx6900xt.txt -------------------------------------------------------------------------------- /gpu-l2-cache/sycl/build.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-cache/sycl/build.sh -------------------------------------------------------------------------------- /gpu-l2-cache/sycl/sycl-gpu-l2-cache.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-cache/sycl/sycl-gpu-l2-cache.cpp -------------------------------------------------------------------------------- /gpu-l2-stream/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-stream/Makefile -------------------------------------------------------------------------------- /gpu-l2-stream/a100_80.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-stream/a100_80.txt -------------------------------------------------------------------------------- /gpu-l2-stream/a40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-stream/a40.txt -------------------------------------------------------------------------------- /gpu-l2-stream/gh200.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-stream/gh200.txt -------------------------------------------------------------------------------- /gpu-l2-stream/l40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-stream/l40.txt -------------------------------------------------------------------------------- /gpu-l2-stream/main.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-stream/main.cu -------------------------------------------------------------------------------- /gpu-l2-stream/mi100.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-stream/mi100.txt -------------------------------------------------------------------------------- /gpu-l2-stream/mi210.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-stream/mi210.txt -------------------------------------------------------------------------------- /gpu-l2-stream/mi300a.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-stream/mi300a.txt -------------------------------------------------------------------------------- /gpu-l2-stream/mi300x.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-stream/mi300x.txt -------------------------------------------------------------------------------- /gpu-l2-stream/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-stream/plot.py -------------------------------------------------------------------------------- /gpu-l2-stream/rx6900xt.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-l2-stream/rx6900xt.txt -------------------------------------------------------------------------------- /gpu-latency/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/Makefile -------------------------------------------------------------------------------- /gpu-latency/a100_80.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/a100_80.txt -------------------------------------------------------------------------------- /gpu-latency/a40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/a40.txt -------------------------------------------------------------------------------- /gpu-latency/gh200.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/gh200.txt -------------------------------------------------------------------------------- /gpu-latency/l40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/l40.txt -------------------------------------------------------------------------------- /gpu-latency/latencies.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/latencies.pdf -------------------------------------------------------------------------------- /gpu-latency/latencies.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/latencies.svg -------------------------------------------------------------------------------- /gpu-latency/latencies_AMD.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/latencies_AMD.pdf -------------------------------------------------------------------------------- /gpu-latency/latencies_AMD.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/latencies_AMD.svg -------------------------------------------------------------------------------- /gpu-latency/latencies_NV.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/latencies_NV.pdf -------------------------------------------------------------------------------- /gpu-latency/latencies_NV.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/latencies_NV.svg -------------------------------------------------------------------------------- /gpu-latency/main.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/main.cu -------------------------------------------------------------------------------- /gpu-latency/mi100.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/mi100.txt -------------------------------------------------------------------------------- /gpu-latency/mi210.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/mi210.txt -------------------------------------------------------------------------------- /gpu-latency/mi300a.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/mi300a.txt -------------------------------------------------------------------------------- /gpu-latency/mi300x.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/mi300x.txt -------------------------------------------------------------------------------- /gpu-latency/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/plot.py -------------------------------------------------------------------------------- /gpu-latency/rx6900xt.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/rx6900xt.txt -------------------------------------------------------------------------------- /gpu-latency/v100.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-latency/v100.txt -------------------------------------------------------------------------------- /gpu-metrics.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-metrics.hpp -------------------------------------------------------------------------------- /gpu-metrics/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-metrics/README.md -------------------------------------------------------------------------------- /gpu-metrics/cuda_metrics/Eval.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-metrics/cuda_metrics/Eval.hpp -------------------------------------------------------------------------------- /gpu-metrics/cuda_metrics/Metric.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-metrics/cuda_metrics/Metric.hpp -------------------------------------------------------------------------------- /gpu-metrics/cuda_metrics/Parser.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-metrics/cuda_metrics/Parser.h -------------------------------------------------------------------------------- /gpu-metrics/cuda_metrics/Parser.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-metrics/cuda_metrics/Parser.hpp -------------------------------------------------------------------------------- /gpu-metrics/cuda_metrics/ScopeExit.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-metrics/cuda_metrics/ScopeExit.h -------------------------------------------------------------------------------- /gpu-metrics/cuda_metrics/Utils.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-metrics/cuda_metrics/Utils.h -------------------------------------------------------------------------------- /gpu-metrics/cuda_metrics/measureMetricPW.cpp: -------------------------------------------------------------------------------- 1 | #include "measureMetricPW.hpp" 2 | -------------------------------------------------------------------------------- /gpu-metrics/cuda_metrics/measureMetricPW.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-metrics/cuda_metrics/measureMetricPW.hpp -------------------------------------------------------------------------------- /gpu-metrics/cuda_metrics/pythonInterface.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-metrics/cuda_metrics/pythonInterface.cpp -------------------------------------------------------------------------------- /gpu-metrics/gpu-metrics.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-metrics/gpu-metrics.hpp -------------------------------------------------------------------------------- /gpu-metrics/rocm_metrics/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-metrics/rocm_metrics/Makefile -------------------------------------------------------------------------------- /gpu-metrics/rocm_metrics/rocm_metrics.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-metrics/rocm_metrics/rocm_metrics.hpp -------------------------------------------------------------------------------- /gpu-metrics/rocm_metrics/test_rocm_metrics: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-metrics/rocm_metrics/test_rocm_metrics -------------------------------------------------------------------------------- /gpu-metrics/rocm_metrics/test_rocm_metrics.hip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-metrics/rocm_metrics/test_rocm_metrics.hip -------------------------------------------------------------------------------- /gpu-metrics/rocm_metrics/vectoradd_hip.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-metrics/rocm_metrics/vectoradd_hip.cpp -------------------------------------------------------------------------------- /gpu-roofline/L40_plot.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-roofline/L40_plot.pdf -------------------------------------------------------------------------------- /gpu-roofline/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-roofline/Makefile -------------------------------------------------------------------------------- /gpu-roofline/alex_a100_40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-roofline/alex_a100_40.txt -------------------------------------------------------------------------------- /gpu-roofline/alex_a40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-roofline/alex_a40.txt -------------------------------------------------------------------------------- /gpu-roofline/genoa_l40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-roofline/genoa_l40.txt -------------------------------------------------------------------------------- /gpu-roofline/h200.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-roofline/h200.txt -------------------------------------------------------------------------------- /gpu-roofline/main.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-roofline/main.cu -------------------------------------------------------------------------------- /gpu-roofline/mi300x.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-roofline/mi300x.txt -------------------------------------------------------------------------------- /gpu-roofline/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-roofline/plot.py -------------------------------------------------------------------------------- /gpu-roofline/series.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-roofline/series.sh -------------------------------------------------------------------------------- /gpu-small-kernels/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/Makefile -------------------------------------------------------------------------------- /gpu-small-kernels/a100_80.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/a100_80.txt -------------------------------------------------------------------------------- /gpu-small-kernels/a100_80_graph.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/a100_80_graph.txt -------------------------------------------------------------------------------- /gpu-small-kernels/a100_80_gsync.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/a100_80_gsync.txt -------------------------------------------------------------------------------- /gpu-small-kernels/a40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/a40.txt -------------------------------------------------------------------------------- /gpu-small-kernels/a40_graph.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/a40_graph.txt -------------------------------------------------------------------------------- /gpu-small-kernels/a40_pt.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/a40_pt.txt -------------------------------------------------------------------------------- /gpu-small-kernels/h200.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/h200.txt -------------------------------------------------------------------------------- /gpu-small-kernels/h200_graph.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/h200_graph.txt -------------------------------------------------------------------------------- /gpu-small-kernels/h200_gsync.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/h200_gsync.txt -------------------------------------------------------------------------------- /gpu-small-kernels/h200_pt.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/h200_pt.txt -------------------------------------------------------------------------------- /gpu-small-kernels/l40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/l40.txt -------------------------------------------------------------------------------- /gpu-small-kernels/l40_graph.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/l40_graph.txt -------------------------------------------------------------------------------- /gpu-small-kernels/l40_gsync.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/l40_gsync.txt -------------------------------------------------------------------------------- /gpu-small-kernels/l40_pt.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/l40_pt.txt -------------------------------------------------------------------------------- /gpu-small-kernels/main.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/main.cu -------------------------------------------------------------------------------- /gpu-small-kernels/mi210.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/mi210.txt -------------------------------------------------------------------------------- /gpu-small-kernels/mi210_graph.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/mi210_graph.txt -------------------------------------------------------------------------------- /gpu-small-kernels/mi210_gsync.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/mi210_gsync.txt -------------------------------------------------------------------------------- /gpu-small-kernels/mi210_pt.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/mi210_pt.txt -------------------------------------------------------------------------------- /gpu-small-kernels/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/plot.py -------------------------------------------------------------------------------- /gpu-small-kernels/readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/readme.md -------------------------------------------------------------------------------- /gpu-small-kernels/repeated-stream.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/repeated-stream.svg -------------------------------------------------------------------------------- /gpu-small-kernels/rx6900xt.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/rx6900xt.txt -------------------------------------------------------------------------------- /gpu-small-kernels/rx6900xt_graph.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/rx6900xt_graph.txt -------------------------------------------------------------------------------- /gpu-small-kernels/rx6900xt_gsync.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/rx6900xt_gsync.txt -------------------------------------------------------------------------------- /gpu-small-kernels/rx6900xt_pt.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-small-kernels/rx6900xt_pt.txt -------------------------------------------------------------------------------- /gpu-stats.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stats.h -------------------------------------------------------------------------------- /gpu-stream/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/Makefile -------------------------------------------------------------------------------- /gpu-stream/a100_40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/a100_40.txt -------------------------------------------------------------------------------- /gpu-stream/a100_80.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/a100_80.txt -------------------------------------------------------------------------------- /gpu-stream/a40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/a40.txt -------------------------------------------------------------------------------- /gpu-stream/cuda-stream.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/cuda-stream.pdf -------------------------------------------------------------------------------- /gpu-stream/cuda-stream.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/cuda-stream.svg -------------------------------------------------------------------------------- /gpu-stream/gh200.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/gh200.txt -------------------------------------------------------------------------------- /gpu-stream/h100_pcie.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/h100_pcie.txt -------------------------------------------------------------------------------- /gpu-stream/l40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/l40.txt -------------------------------------------------------------------------------- /gpu-stream/main.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/main.cu -------------------------------------------------------------------------------- /gpu-stream/maxbars.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/maxbars.pdf -------------------------------------------------------------------------------- /gpu-stream/maxbars.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/maxbars.svg -------------------------------------------------------------------------------- /gpu-stream/mi100.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/mi100.txt -------------------------------------------------------------------------------- /gpu-stream/mi210.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/mi210.txt -------------------------------------------------------------------------------- /gpu-stream/mi300a.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/mi300a.txt -------------------------------------------------------------------------------- /gpu-stream/mi300x.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/mi300x.txt -------------------------------------------------------------------------------- /gpu-stream/minbars.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/minbars.pdf -------------------------------------------------------------------------------- /gpu-stream/minbars.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/minbars.svg -------------------------------------------------------------------------------- /gpu-stream/past_results/a100_40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/past_results/a100_40.txt -------------------------------------------------------------------------------- /gpu-stream/past_results/h100_pcie.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/past_results/h100_pcie.txt -------------------------------------------------------------------------------- /gpu-stream/plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/plot.py -------------------------------------------------------------------------------- /gpu-stream/rx6900xt.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/rx6900xt.txt -------------------------------------------------------------------------------- /gpu-stream/v100.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-stream/v100.txt -------------------------------------------------------------------------------- /gpu-strides/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-strides/Makefile -------------------------------------------------------------------------------- /gpu-strides/a100.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-strides/a100.txt -------------------------------------------------------------------------------- /gpu-strides/a40.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-strides/a40.txt -------------------------------------------------------------------------------- /gpu-strides/h200.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-strides/h200.txt -------------------------------------------------------------------------------- /gpu-strides/l1plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-strides/l1plot.py -------------------------------------------------------------------------------- /gpu-strides/main.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-strides/main.cu -------------------------------------------------------------------------------- /gpu-strides/mi210.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-strides/mi210.txt -------------------------------------------------------------------------------- /gpu-strides/rdna2.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/gpu-strides/rdna2.txt -------------------------------------------------------------------------------- /measure_metric/Eval.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/measure_metric/Eval.hpp -------------------------------------------------------------------------------- /measure_metric/Metric.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/measure_metric/Metric.hpp -------------------------------------------------------------------------------- /measure_metric/Parser.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/measure_metric/Parser.h -------------------------------------------------------------------------------- /measure_metric/Parser.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/measure_metric/Parser.hpp -------------------------------------------------------------------------------- /measure_metric/ScopeExit.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/measure_metric/ScopeExit.h -------------------------------------------------------------------------------- /measure_metric/Utils.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/measure_metric/Utils.h -------------------------------------------------------------------------------- /measure_metric/measureMetricPW.cpp: -------------------------------------------------------------------------------- 1 | #include "measureMetricPW.hpp" 2 | -------------------------------------------------------------------------------- /measure_metric/measureMetricPW.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/measure_metric/measureMetricPW.hpp -------------------------------------------------------------------------------- /measure_metric/pythonInterface.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/measure_metric/pythonInterface.cpp -------------------------------------------------------------------------------- /metrics.cuh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/metrics.cuh -------------------------------------------------------------------------------- /rocm-metrics/rocm-metrics.hpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/rocm-metrics/rocm-metrics.hpp -------------------------------------------------------------------------------- /um-stream/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/um-stream/Makefile -------------------------------------------------------------------------------- /um-stream/main.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/um-stream/main.cu -------------------------------------------------------------------------------- /unmaintained/cuda-3d-stream/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/unmaintained/cuda-3d-stream/Makefile -------------------------------------------------------------------------------- /unmaintained/cuda-3d-stream/main.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/unmaintained/cuda-3d-stream/main.cu -------------------------------------------------------------------------------- /unmaintained/cuda-busy/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/unmaintained/cuda-busy/Makefile -------------------------------------------------------------------------------- /unmaintained/cuda-busy/main.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/unmaintained/cuda-busy/main.cu -------------------------------------------------------------------------------- /unmaintained/cuda-cache-overlap/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/unmaintained/cuda-cache-overlap/Makefile -------------------------------------------------------------------------------- /unmaintained/cuda-cache-overlap/main.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/unmaintained/cuda-cache-overlap/main.cu -------------------------------------------------------------------------------- /unmaintained/cuda-cache-patterns/cuda-cache-patterns.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/unmaintained/cuda-cache-patterns/cuda-cache-patterns.ipynb -------------------------------------------------------------------------------- /unmaintained/cuda-gapped-stream/Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/unmaintained/cuda-gapped-stream/Makefile -------------------------------------------------------------------------------- /unmaintained/cuda-gapped-stream/main.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/unmaintained/cuda-gapped-stream/main.cu -------------------------------------------------------------------------------- /unmaintained/cuda-l1/cuda-l1.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RRZE-HPC/gpu-benches/HEAD/unmaintained/cuda-l1/cuda-l1.ipynb --------------------------------------------------------------------------------