├── .gitignore ├── .vscode └── settings.json ├── LICENSE.txt ├── README.md ├── assets ├── benchmark_comparison.png ├── header.png └── table.png ├── benchmarking_offline.py ├── benchmarking_server.py ├── benchmarking_utils.py ├── compile.py ├── cublas ├── hgemm_cublas.cu ├── hgemm_cublaslt_auto_tuning.cu └── hgemm_cublaslt_heuristic.cu ├── eval_one_file.sh ├── eval_results ├── cuda_l2_a100_F16F16F16F16_speedup_offline.csv └── cuda_l2_a100_F16F16F16F16_speedup_server.csv ├── kernels └── a100_F16F16F16F16 │ ├── 1024_1024_1024.cu │ ├── 1024_1024_12288.cu │ ├── 1024_1024_128.cu │ ├── 1024_1024_16384.cu │ ├── 1024_1024_2048.cu │ ├── 1024_1024_256.cu │ ├── 1024_1024_4096.cu │ ├── 1024_1024_512.cu │ ├── 1024_1024_64.cu │ ├── 1024_1024_8192.cu │ ├── 1024_12288_1024.cu │ ├── 1024_12288_12288.cu │ ├── 1024_12288_128.cu │ ├── 1024_12288_16384.cu │ ├── 1024_12288_2048.cu │ ├── 1024_12288_256.cu │ ├── 1024_12288_4096.cu │ ├── 1024_12288_512.cu │ ├── 1024_12288_64.cu │ ├── 1024_12288_8192.cu │ ├── 1024_128_1024.cu │ ├── 1024_128_12288.cu │ ├── 1024_128_128.cu │ ├── 1024_128_16384.cu │ ├── 1024_128_2048.cu │ ├── 1024_128_256.cu │ ├── 1024_128_4096.cu │ ├── 1024_128_512.cu │ ├── 1024_128_64.cu │ ├── 1024_128_8192.cu │ ├── 1024_16384_1024.cu │ ├── 1024_16384_12288.cu │ ├── 1024_16384_128.cu │ ├── 1024_16384_16384.cu │ ├── 1024_16384_2048.cu │ ├── 1024_16384_256.cu │ ├── 1024_16384_4096.cu │ ├── 1024_16384_512.cu │ ├── 1024_16384_64.cu │ ├── 1024_16384_8192.cu │ ├── 1024_2048_1024.cu │ ├── 1024_2048_12288.cu │ ├── 1024_2048_128.cu │ ├── 1024_2048_16384.cu │ ├── 1024_2048_2048.cu │ ├── 1024_2048_256.cu │ ├── 1024_2048_4096.cu │ ├── 1024_2048_512.cu │ ├── 1024_2048_64.cu │ ├── 1024_2048_8192.cu │ ├── 1024_256_1024.cu │ ├── 1024_256_12288.cu │ ├── 1024_256_128.cu │ ├── 1024_256_16384.cu │ ├── 1024_256_2048.cu │ ├── 1024_256_256.cu │ ├── 1024_256_4096.cu │ ├── 1024_256_512.cu │ ├── 1024_256_64.cu │ ├── 1024_256_8192.cu │ ├── 1024_4096_1024.cu │ ├── 1024_4096_12288.cu │ ├── 1024_4096_128.cu │ ├── 1024_4096_16384.cu │ ├── 1024_4096_2048.cu │ ├── 1024_4096_256.cu │ ├── 1024_4096_4096.cu │ ├── 1024_4096_512.cu │ ├── 1024_4096_64.cu │ ├── 1024_4096_8192.cu │ ├── 1024_512_1024.cu │ ├── 1024_512_12288.cu │ ├── 1024_512_128.cu │ ├── 1024_512_16384.cu │ ├── 1024_512_2048.cu │ ├── 1024_512_256.cu │ ├── 1024_512_4096.cu │ ├── 1024_512_512.cu │ ├── 1024_512_64.cu │ ├── 1024_512_8192.cu │ ├── 1024_64_1024.cu │ ├── 1024_64_12288.cu │ ├── 1024_64_128.cu │ ├── 1024_64_16384.cu │ ├── 1024_64_2048.cu │ ├── 1024_64_256.cu │ ├── 1024_64_4096.cu │ ├── 1024_64_512.cu │ ├── 1024_64_64.cu │ ├── 1024_64_8192.cu │ ├── 1024_8192_1024.cu │ ├── 1024_8192_12288.cu │ ├── 1024_8192_128.cu │ ├── 1024_8192_16384.cu │ ├── 1024_8192_2048.cu │ ├── 1024_8192_256.cu │ ├── 1024_8192_4096.cu │ ├── 1024_8192_512.cu │ ├── 1024_8192_64.cu │ ├── 1024_8192_8192.cu │ ├── 12288_1024_1024.cu │ ├── 12288_1024_12288.cu │ ├── 12288_1024_128.cu │ ├── 12288_1024_16384.cu │ ├── 12288_1024_2048.cu │ ├── 12288_1024_256.cu │ ├── 12288_1024_4096.cu │ ├── 12288_1024_512.cu │ ├── 12288_1024_64.cu │ ├── 12288_1024_8192.cu │ ├── 12288_12288_1024.cu │ ├── 12288_12288_12288.cu │ ├── 12288_12288_128.cu │ ├── 12288_12288_16384.cu │ ├── 12288_12288_2048.cu │ ├── 12288_12288_256.cu │ ├── 12288_12288_4096.cu │ ├── 12288_12288_512.cu │ ├── 12288_12288_64.cu │ ├── 12288_12288_8192.cu │ ├── 12288_128_1024.cu │ ├── 12288_128_12288.cu │ ├── 12288_128_128.cu │ ├── 12288_128_16384.cu │ ├── 12288_128_2048.cu │ ├── 12288_128_256.cu │ ├── 12288_128_4096.cu │ ├── 12288_128_512.cu │ ├── 12288_128_64.cu │ ├── 12288_128_8192.cu │ ├── 12288_16384_1024.cu │ ├── 12288_16384_12288.cu │ ├── 12288_16384_128.cu │ ├── 12288_16384_16384.cu │ ├── 12288_16384_2048.cu │ ├── 12288_16384_256.cu │ ├── 12288_16384_4096.cu │ ├── 12288_16384_512.cu │ ├── 12288_16384_64.cu │ ├── 12288_16384_8192.cu │ ├── 12288_2048_1024.cu │ ├── 12288_2048_12288.cu │ ├── 12288_2048_128.cu │ ├── 12288_2048_16384.cu │ ├── 12288_2048_2048.cu │ ├── 12288_2048_256.cu │ ├── 12288_2048_4096.cu │ ├── 12288_2048_512.cu │ ├── 12288_2048_64.cu │ ├── 12288_2048_8192.cu │ ├── 12288_256_1024.cu │ ├── 12288_256_12288.cu │ ├── 12288_256_128.cu │ ├── 12288_256_16384.cu │ ├── 12288_256_2048.cu │ ├── 12288_256_256.cu │ ├── 12288_256_4096.cu │ ├── 12288_256_512.cu │ ├── 12288_256_64.cu │ ├── 12288_256_8192.cu │ ├── 12288_4096_1024.cu │ ├── 12288_4096_12288.cu │ ├── 12288_4096_128.cu │ ├── 12288_4096_16384.cu │ ├── 12288_4096_2048.cu │ ├── 12288_4096_256.cu │ ├── 12288_4096_4096.cu │ ├── 12288_4096_512.cu │ ├── 12288_4096_64.cu │ ├── 12288_4096_8192.cu │ ├── 12288_512_1024.cu │ ├── 12288_512_12288.cu │ ├── 12288_512_128.cu │ ├── 12288_512_16384.cu │ ├── 12288_512_2048.cu │ ├── 12288_512_256.cu │ ├── 12288_512_4096.cu │ ├── 12288_512_512.cu │ ├── 12288_512_64.cu │ ├── 12288_512_8192.cu │ ├── 12288_64_1024.cu │ ├── 12288_64_12288.cu │ ├── 12288_64_128.cu │ ├── 12288_64_16384.cu │ ├── 12288_64_2048.cu │ ├── 12288_64_256.cu │ ├── 12288_64_4096.cu │ ├── 12288_64_512.cu │ ├── 12288_64_64.cu │ ├── 12288_64_8192.cu │ ├── 12288_8192_1024.cu │ ├── 12288_8192_12288.cu │ ├── 12288_8192_128.cu │ ├── 12288_8192_16384.cu │ ├── 12288_8192_2048.cu │ ├── 12288_8192_256.cu │ ├── 12288_8192_4096.cu │ ├── 12288_8192_512.cu │ ├── 12288_8192_64.cu │ ├── 12288_8192_8192.cu │ ├── 128_1024_1024.cu │ ├── 128_1024_12288.cu │ ├── 128_1024_128.cu │ ├── 128_1024_16384.cu │ ├── 128_1024_2048.cu │ ├── 128_1024_256.cu │ ├── 128_1024_4096.cu │ ├── 128_1024_512.cu │ ├── 128_1024_64.cu │ ├── 128_1024_8192.cu │ ├── 128_12288_1024.cu │ ├── 128_12288_12288.cu │ ├── 128_12288_128.cu │ ├── 128_12288_16384.cu │ ├── 128_12288_2048.cu │ ├── 128_12288_256.cu │ ├── 128_12288_4096.cu │ ├── 128_12288_512.cu │ ├── 128_12288_64.cu │ ├── 128_12288_8192.cu │ ├── 128_128_1024.cu │ ├── 128_128_12288.cu │ ├── 128_128_128.cu │ ├── 128_128_16384.cu │ ├── 128_128_2048.cu │ ├── 128_128_256.cu │ ├── 128_128_4096.cu │ ├── 128_128_512.cu │ ├── 128_128_64.cu │ ├── 128_128_8192.cu │ ├── 128_16384_1024.cu │ ├── 128_16384_12288.cu │ ├── 128_16384_128.cu │ ├── 128_16384_16384.cu │ ├── 128_16384_2048.cu │ ├── 128_16384_256.cu │ ├── 128_16384_4096.cu │ ├── 128_16384_512.cu │ ├── 128_16384_64.cu │ ├── 128_16384_8192.cu │ ├── 128_2048_1024.cu │ ├── 128_2048_12288.cu │ ├── 128_2048_128.cu │ ├── 128_2048_16384.cu │ ├── 128_2048_2048.cu │ ├── 128_2048_256.cu │ ├── 128_2048_4096.cu │ ├── 128_2048_512.cu │ ├── 128_2048_64.cu │ ├── 128_2048_8192.cu │ ├── 128_256_1024.cu │ ├── 128_256_12288.cu │ ├── 128_256_128.cu │ ├── 128_256_16384.cu │ ├── 128_256_2048.cu │ ├── 128_256_256.cu │ ├── 128_256_4096.cu │ ├── 128_256_512.cu │ ├── 128_256_64.cu │ ├── 128_256_8192.cu │ ├── 128_4096_1024.cu │ ├── 128_4096_12288.cu │ ├── 128_4096_128.cu │ ├── 128_4096_16384.cu │ ├── 128_4096_2048.cu │ ├── 128_4096_256.cu │ ├── 128_4096_4096.cu │ ├── 128_4096_512.cu │ ├── 128_4096_64.cu │ ├── 128_4096_8192.cu │ ├── 128_512_1024.cu │ ├── 128_512_12288.cu │ ├── 128_512_128.cu │ ├── 128_512_16384.cu │ ├── 128_512_2048.cu │ ├── 128_512_256.cu │ ├── 128_512_4096.cu │ ├── 128_512_512.cu │ ├── 128_512_64.cu │ ├── 128_512_8192.cu │ ├── 128_64_1024.cu │ ├── 128_64_12288.cu │ ├── 128_64_128.cu │ ├── 128_64_16384.cu │ ├── 128_64_2048.cu │ ├── 128_64_256.cu │ ├── 128_64_4096.cu │ ├── 128_64_512.cu │ ├── 128_64_64.cu │ ├── 128_64_8192.cu │ ├── 128_8192_1024.cu │ ├── 128_8192_12288.cu │ ├── 128_8192_128.cu │ ├── 128_8192_16384.cu │ ├── 128_8192_2048.cu │ ├── 128_8192_256.cu │ ├── 128_8192_4096.cu │ ├── 128_8192_512.cu │ ├── 128_8192_64.cu │ ├── 128_8192_8192.cu │ ├── 16384_1024_1024.cu │ ├── 16384_1024_12288.cu │ ├── 16384_1024_128.cu │ ├── 16384_1024_16384.cu │ ├── 16384_1024_2048.cu │ ├── 16384_1024_256.cu │ ├── 16384_1024_4096.cu │ ├── 16384_1024_512.cu │ ├── 16384_1024_64.cu │ ├── 16384_1024_8192.cu │ ├── 16384_12288_1024.cu │ ├── 16384_12288_12288.cu │ ├── 16384_12288_128.cu │ ├── 16384_12288_16384.cu │ ├── 16384_12288_2048.cu │ ├── 16384_12288_256.cu │ ├── 16384_12288_4096.cu │ ├── 16384_12288_512.cu │ ├── 16384_12288_64.cu │ ├── 16384_12288_8192.cu │ ├── 16384_128_1024.cu │ ├── 16384_128_12288.cu │ ├── 16384_128_128.cu │ ├── 16384_128_16384.cu │ ├── 16384_128_2048.cu │ ├── 16384_128_256.cu │ ├── 16384_128_4096.cu │ ├── 16384_128_512.cu │ ├── 16384_128_64.cu │ ├── 16384_128_8192.cu │ ├── 16384_16384_1024.cu │ ├── 16384_16384_12288.cu │ ├── 16384_16384_128.cu │ ├── 16384_16384_16384.cu │ ├── 16384_16384_2048.cu │ ├── 16384_16384_256.cu │ ├── 16384_16384_4096.cu │ ├── 16384_16384_512.cu │ ├── 16384_16384_64.cu │ ├── 16384_16384_8192.cu │ ├── 16384_2048_1024.cu │ ├── 16384_2048_12288.cu │ ├── 16384_2048_128.cu │ ├── 16384_2048_16384.cu │ ├── 16384_2048_2048.cu │ ├── 16384_2048_256.cu │ ├── 16384_2048_4096.cu │ ├── 16384_2048_512.cu │ ├── 16384_2048_64.cu │ ├── 16384_2048_8192.cu │ ├── 16384_256_1024.cu │ ├── 16384_256_12288.cu │ ├── 16384_256_128.cu │ ├── 16384_256_16384.cu │ ├── 16384_256_2048.cu │ ├── 16384_256_256.cu │ ├── 16384_256_4096.cu │ ├── 16384_256_512.cu │ ├── 16384_256_64.cu │ ├── 16384_256_8192.cu │ ├── 16384_4096_1024.cu │ ├── 16384_4096_12288.cu │ ├── 16384_4096_128.cu │ ├── 16384_4096_16384.cu │ ├── 16384_4096_2048.cu │ ├── 16384_4096_256.cu │ ├── 16384_4096_4096.cu │ ├── 16384_4096_512.cu │ ├── 16384_4096_64.cu │ ├── 16384_4096_8192.cu │ ├── 16384_512_1024.cu │ ├── 16384_512_12288.cu │ ├── 16384_512_128.cu │ ├── 16384_512_16384.cu │ ├── 16384_512_2048.cu │ ├── 16384_512_256.cu │ ├── 16384_512_4096.cu │ ├── 16384_512_512.cu │ ├── 16384_512_64.cu │ ├── 16384_512_8192.cu │ ├── 16384_64_1024.cu │ ├── 16384_64_12288.cu │ ├── 16384_64_128.cu │ ├── 16384_64_16384.cu │ ├── 16384_64_2048.cu │ ├── 16384_64_256.cu │ ├── 16384_64_4096.cu │ ├── 16384_64_512.cu │ ├── 16384_64_64.cu │ ├── 16384_64_8192.cu │ ├── 16384_8192_1024.cu │ ├── 16384_8192_12288.cu │ ├── 16384_8192_128.cu │ ├── 16384_8192_16384.cu │ ├── 16384_8192_2048.cu │ ├── 16384_8192_256.cu │ ├── 16384_8192_4096.cu │ ├── 16384_8192_512.cu │ ├── 16384_8192_64.cu │ ├── 16384_8192_8192.cu │ ├── 2048_1024_1024.cu │ ├── 2048_1024_12288.cu │ ├── 2048_1024_128.cu │ ├── 2048_1024_16384.cu │ ├── 2048_1024_2048.cu │ ├── 2048_1024_256.cu │ ├── 2048_1024_4096.cu │ ├── 2048_1024_512.cu │ ├── 2048_1024_64.cu │ ├── 2048_1024_8192.cu │ ├── 2048_12288_1024.cu │ ├── 2048_12288_12288.cu │ ├── 2048_12288_128.cu │ ├── 2048_12288_16384.cu │ ├── 2048_12288_2048.cu │ ├── 2048_12288_256.cu │ ├── 2048_12288_4096.cu │ ├── 2048_12288_512.cu │ ├── 2048_12288_64.cu │ ├── 2048_12288_8192.cu │ ├── 2048_128_1024.cu │ ├── 2048_128_12288.cu │ ├── 2048_128_128.cu │ ├── 2048_128_16384.cu │ ├── 2048_128_2048.cu │ ├── 2048_128_256.cu │ ├── 2048_128_4096.cu │ ├── 2048_128_512.cu │ ├── 2048_128_64.cu │ ├── 2048_128_8192.cu │ ├── 2048_16384_1024.cu │ ├── 2048_16384_12288.cu │ ├── 2048_16384_128.cu │ ├── 2048_16384_16384.cu │ ├── 2048_16384_2048.cu │ ├── 2048_16384_256.cu │ ├── 2048_16384_4096.cu │ ├── 2048_16384_512.cu │ ├── 2048_16384_64.cu │ ├── 2048_16384_8192.cu │ ├── 2048_2048_1024.cu │ ├── 2048_2048_12288.cu │ ├── 2048_2048_128.cu │ ├── 2048_2048_16384.cu │ ├── 2048_2048_2048.cu │ ├── 2048_2048_256.cu │ ├── 2048_2048_4096.cu │ ├── 2048_2048_512.cu │ ├── 2048_2048_64.cu │ ├── 2048_2048_8192.cu │ ├── 2048_256_1024.cu │ ├── 2048_256_12288.cu │ ├── 2048_256_128.cu │ ├── 2048_256_16384.cu │ ├── 2048_256_2048.cu │ ├── 2048_256_256.cu │ ├── 2048_256_4096.cu │ ├── 2048_256_512.cu │ ├── 2048_256_64.cu │ ├── 2048_256_8192.cu │ ├── 2048_4096_1024.cu │ ├── 2048_4096_12288.cu │ ├── 2048_4096_128.cu │ ├── 2048_4096_16384.cu │ ├── 2048_4096_2048.cu │ ├── 2048_4096_256.cu │ ├── 2048_4096_4096.cu │ ├── 2048_4096_512.cu │ ├── 2048_4096_64.cu │ ├── 2048_4096_8192.cu │ ├── 2048_512_1024.cu │ ├── 2048_512_12288.cu │ ├── 2048_512_128.cu │ ├── 2048_512_16384.cu │ ├── 2048_512_2048.cu │ ├── 2048_512_256.cu │ ├── 2048_512_4096.cu │ ├── 2048_512_512.cu │ ├── 2048_512_64.cu │ ├── 2048_512_8192.cu │ ├── 2048_64_1024.cu │ ├── 2048_64_12288.cu │ ├── 2048_64_128.cu │ ├── 2048_64_16384.cu │ ├── 2048_64_2048.cu │ ├── 2048_64_256.cu │ ├── 2048_64_4096.cu │ ├── 2048_64_512.cu │ ├── 2048_64_64.cu │ ├── 2048_64_8192.cu │ ├── 2048_8192_1024.cu │ ├── 2048_8192_12288.cu │ ├── 2048_8192_128.cu │ ├── 2048_8192_16384.cu │ ├── 2048_8192_2048.cu │ ├── 2048_8192_256.cu │ ├── 2048_8192_4096.cu │ ├── 2048_8192_512.cu │ ├── 2048_8192_64.cu │ ├── 2048_8192_8192.cu │ ├── 256_1024_1024.cu │ ├── 256_1024_12288.cu │ ├── 256_1024_128.cu │ ├── 256_1024_16384.cu │ ├── 256_1024_2048.cu │ ├── 256_1024_256.cu │ ├── 256_1024_4096.cu │ ├── 256_1024_512.cu │ ├── 256_1024_64.cu │ ├── 256_1024_8192.cu │ ├── 256_12288_1024.cu │ ├── 256_12288_12288.cu │ ├── 256_12288_128.cu │ ├── 256_12288_16384.cu │ ├── 256_12288_2048.cu │ ├── 256_12288_256.cu │ ├── 256_12288_4096.cu │ ├── 256_12288_512.cu │ ├── 256_12288_64.cu │ ├── 256_12288_8192.cu │ ├── 256_128_1024.cu │ ├── 256_128_12288.cu │ ├── 256_128_128.cu │ ├── 256_128_16384.cu │ ├── 256_128_2048.cu │ ├── 256_128_256.cu │ ├── 256_128_4096.cu │ ├── 256_128_512.cu │ ├── 256_128_64.cu │ ├── 256_128_8192.cu │ ├── 256_16384_1024.cu │ ├── 256_16384_12288.cu │ ├── 256_16384_128.cu │ ├── 256_16384_16384.cu │ ├── 256_16384_2048.cu │ ├── 256_16384_256.cu │ ├── 256_16384_4096.cu │ ├── 256_16384_512.cu │ ├── 256_16384_64.cu │ ├── 256_16384_8192.cu │ ├── 256_2048_1024.cu │ ├── 256_2048_12288.cu │ ├── 256_2048_128.cu │ ├── 256_2048_16384.cu │ ├── 256_2048_2048.cu │ ├── 256_2048_256.cu │ ├── 256_2048_4096.cu │ ├── 256_2048_512.cu │ ├── 256_2048_64.cu │ ├── 256_2048_8192.cu │ ├── 256_256_1024.cu │ ├── 256_256_12288.cu │ ├── 256_256_128.cu │ ├── 256_256_16384.cu │ ├── 256_256_2048.cu │ ├── 256_256_256.cu │ ├── 256_256_4096.cu │ ├── 256_256_512.cu │ ├── 256_256_64.cu │ ├── 256_256_8192.cu │ ├── 256_4096_1024.cu │ ├── 256_4096_12288.cu │ ├── 256_4096_128.cu │ ├── 256_4096_16384.cu │ ├── 256_4096_2048.cu │ ├── 256_4096_256.cu │ ├── 256_4096_4096.cu │ ├── 256_4096_512.cu │ ├── 256_4096_64.cu │ ├── 256_4096_8192.cu │ ├── 256_512_1024.cu │ ├── 256_512_12288.cu │ ├── 256_512_128.cu │ ├── 256_512_16384.cu │ ├── 256_512_2048.cu │ ├── 256_512_256.cu │ ├── 256_512_4096.cu │ ├── 256_512_512.cu │ ├── 256_512_64.cu │ ├── 256_512_8192.cu │ ├── 256_64_1024.cu │ ├── 256_64_12288.cu │ ├── 256_64_128.cu │ ├── 256_64_16384.cu │ ├── 256_64_2048.cu │ ├── 256_64_256.cu │ ├── 256_64_4096.cu │ ├── 256_64_512.cu │ ├── 256_64_64.cu │ ├── 256_64_8192.cu │ ├── 256_8192_1024.cu │ ├── 256_8192_12288.cu │ ├── 256_8192_128.cu │ ├── 256_8192_16384.cu │ ├── 256_8192_2048.cu │ ├── 256_8192_256.cu │ ├── 256_8192_4096.cu │ ├── 256_8192_512.cu │ ├── 256_8192_64.cu │ ├── 256_8192_8192.cu │ ├── 4096_1024_1024.cu │ ├── 4096_1024_12288.cu │ ├── 4096_1024_128.cu │ ├── 4096_1024_16384.cu │ ├── 4096_1024_2048.cu │ ├── 4096_1024_256.cu │ ├── 4096_1024_4096.cu │ ├── 4096_1024_512.cu │ ├── 4096_1024_64.cu │ ├── 4096_1024_8192.cu │ ├── 4096_12288_1024.cu │ ├── 4096_12288_12288.cu │ ├── 4096_12288_128.cu │ ├── 4096_12288_16384.cu │ ├── 4096_12288_2048.cu │ ├── 4096_12288_256.cu │ ├── 4096_12288_4096.cu │ ├── 4096_12288_512.cu │ ├── 4096_12288_64.cu │ ├── 4096_12288_8192.cu │ ├── 4096_128_1024.cu │ ├── 4096_128_12288.cu │ ├── 4096_128_128.cu │ ├── 4096_128_16384.cu │ ├── 4096_128_2048.cu │ ├── 4096_128_256.cu │ ├── 4096_128_4096.cu │ ├── 4096_128_512.cu │ ├── 4096_128_64.cu │ ├── 4096_128_8192.cu │ ├── 4096_16384_1024.cu │ ├── 4096_16384_12288.cu │ ├── 4096_16384_128.cu │ ├── 4096_16384_16384.cu │ ├── 4096_16384_2048.cu │ ├── 4096_16384_256.cu │ ├── 4096_16384_4096.cu │ ├── 4096_16384_512.cu │ ├── 4096_16384_64.cu │ ├── 4096_16384_8192.cu │ ├── 4096_2048_1024.cu │ ├── 4096_2048_12288.cu │ ├── 4096_2048_128.cu │ ├── 4096_2048_16384.cu │ ├── 4096_2048_2048.cu │ ├── 4096_2048_256.cu │ ├── 4096_2048_4096.cu │ ├── 4096_2048_512.cu │ ├── 4096_2048_64.cu │ ├── 4096_2048_8192.cu │ ├── 4096_256_1024.cu │ ├── 4096_256_12288.cu │ ├── 4096_256_128.cu │ ├── 4096_256_16384.cu │ ├── 4096_256_2048.cu │ ├── 4096_256_256.cu │ ├── 4096_256_4096.cu │ ├── 4096_256_512.cu │ ├── 4096_256_64.cu │ ├── 4096_256_8192.cu │ ├── 4096_4096_1024.cu │ ├── 4096_4096_12288.cu │ ├── 4096_4096_128.cu │ ├── 4096_4096_16384.cu │ ├── 4096_4096_2048.cu │ ├── 4096_4096_256.cu │ ├── 4096_4096_4096.cu │ ├── 4096_4096_512.cu │ ├── 4096_4096_64.cu │ ├── 4096_4096_8192.cu │ ├── 4096_512_1024.cu │ ├── 4096_512_12288.cu │ ├── 4096_512_128.cu │ ├── 4096_512_16384.cu │ ├── 4096_512_2048.cu │ ├── 4096_512_256.cu │ ├── 4096_512_4096.cu │ ├── 4096_512_512.cu │ ├── 4096_512_64.cu │ ├── 4096_512_8192.cu │ ├── 4096_64_1024.cu │ ├── 4096_64_12288.cu │ ├── 4096_64_128.cu │ ├── 4096_64_16384.cu │ ├── 4096_64_2048.cu │ ├── 4096_64_256.cu │ ├── 4096_64_4096.cu │ ├── 4096_64_512.cu │ ├── 4096_64_64.cu │ ├── 4096_64_8192.cu │ ├── 4096_8192_1024.cu │ ├── 4096_8192_12288.cu │ ├── 4096_8192_128.cu │ ├── 4096_8192_16384.cu │ ├── 4096_8192_2048.cu │ ├── 4096_8192_256.cu │ ├── 4096_8192_4096.cu │ ├── 4096_8192_512.cu │ ├── 4096_8192_64.cu │ ├── 4096_8192_8192.cu │ ├── 512_1024_1024.cu │ ├── 512_1024_12288.cu │ ├── 512_1024_128.cu │ ├── 512_1024_16384.cu │ ├── 512_1024_2048.cu │ ├── 512_1024_256.cu │ ├── 512_1024_4096.cu │ ├── 512_1024_512.cu │ ├── 512_1024_64.cu │ ├── 512_1024_8192.cu │ ├── 512_12288_1024.cu │ ├── 512_12288_12288.cu │ ├── 512_12288_128.cu │ ├── 512_12288_16384.cu │ ├── 512_12288_2048.cu │ ├── 512_12288_256.cu │ ├── 512_12288_4096.cu │ ├── 512_12288_512.cu │ ├── 512_12288_64.cu │ ├── 512_12288_8192.cu │ ├── 512_128_1024.cu │ ├── 512_128_12288.cu │ ├── 512_128_128.cu │ ├── 512_128_16384.cu │ ├── 512_128_2048.cu │ ├── 512_128_256.cu │ ├── 512_128_4096.cu │ ├── 512_128_512.cu │ ├── 512_128_64.cu │ ├── 512_128_8192.cu │ ├── 512_16384_1024.cu │ ├── 512_16384_12288.cu │ ├── 512_16384_128.cu │ ├── 512_16384_16384.cu │ ├── 512_16384_2048.cu │ ├── 512_16384_256.cu │ ├── 512_16384_4096.cu │ ├── 512_16384_512.cu │ ├── 512_16384_64.cu │ ├── 512_16384_8192.cu │ ├── 512_2048_1024.cu │ ├── 512_2048_12288.cu │ ├── 512_2048_128.cu │ ├── 512_2048_16384.cu │ ├── 512_2048_2048.cu │ ├── 512_2048_256.cu │ ├── 512_2048_4096.cu │ ├── 512_2048_512.cu │ ├── 512_2048_64.cu │ ├── 512_2048_8192.cu │ ├── 512_256_1024.cu │ ├── 512_256_12288.cu │ ├── 512_256_128.cu │ ├── 512_256_16384.cu │ ├── 512_256_2048.cu │ ├── 512_256_256.cu │ ├── 512_256_4096.cu │ ├── 512_256_512.cu │ ├── 512_256_64.cu │ ├── 512_256_8192.cu │ ├── 512_4096_1024.cu │ ├── 512_4096_12288.cu │ ├── 512_4096_128.cu │ ├── 512_4096_16384.cu │ ├── 512_4096_2048.cu │ ├── 512_4096_256.cu │ ├── 512_4096_4096.cu │ ├── 512_4096_512.cu │ ├── 512_4096_64.cu │ ├── 512_4096_8192.cu │ ├── 512_512_1024.cu │ ├── 512_512_12288.cu │ ├── 512_512_128.cu │ ├── 512_512_16384.cu │ ├── 512_512_2048.cu │ ├── 512_512_256.cu │ ├── 512_512_4096.cu │ ├── 512_512_512.cu │ ├── 512_512_64.cu │ ├── 512_512_8192.cu │ ├── 512_64_1024.cu │ ├── 512_64_12288.cu │ ├── 512_64_128.cu │ ├── 512_64_16384.cu │ ├── 512_64_2048.cu │ ├── 512_64_256.cu │ ├── 512_64_4096.cu │ ├── 512_64_512.cu │ ├── 512_64_64.cu │ ├── 512_64_8192.cu │ ├── 512_8192_1024.cu │ ├── 512_8192_12288.cu │ ├── 512_8192_128.cu │ ├── 512_8192_16384.cu │ ├── 512_8192_2048.cu │ ├── 512_8192_256.cu │ ├── 512_8192_4096.cu │ ├── 512_8192_512.cu │ ├── 512_8192_64.cu │ ├── 512_8192_8192.cu │ ├── 64_1024_1024.cu │ ├── 64_1024_12288.cu │ ├── 64_1024_128.cu │ ├── 64_1024_16384.cu │ ├── 64_1024_2048.cu │ ├── 64_1024_256.cu │ ├── 64_1024_4096.cu │ ├── 64_1024_512.cu │ ├── 64_1024_64.cu │ ├── 64_1024_8192.cu │ ├── 64_12288_1024.cu │ ├── 64_12288_12288.cu │ ├── 64_12288_128.cu │ ├── 64_12288_16384.cu │ ├── 64_12288_2048.cu │ ├── 64_12288_256.cu │ ├── 64_12288_4096.cu │ ├── 64_12288_512.cu │ ├── 64_12288_64.cu │ ├── 64_12288_8192.cu │ ├── 64_128_1024.cu │ ├── 64_128_12288.cu │ ├── 64_128_128.cu │ ├── 64_128_16384.cu │ ├── 64_128_2048.cu │ ├── 64_128_256.cu │ ├── 64_128_4096.cu │ ├── 64_128_512.cu │ ├── 64_128_64.cu │ ├── 64_128_8192.cu │ ├── 64_16384_1024.cu │ ├── 64_16384_12288.cu │ ├── 64_16384_128.cu │ ├── 64_16384_16384.cu │ ├── 64_16384_2048.cu │ ├── 64_16384_256.cu │ ├── 64_16384_4096.cu │ ├── 64_16384_512.cu │ ├── 64_16384_64.cu │ ├── 64_16384_8192.cu │ ├── 64_2048_1024.cu │ ├── 64_2048_12288.cu │ ├── 64_2048_128.cu │ ├── 64_2048_16384.cu │ ├── 64_2048_2048.cu │ ├── 64_2048_256.cu │ ├── 64_2048_4096.cu │ ├── 64_2048_512.cu │ ├── 64_2048_64.cu │ ├── 64_2048_8192.cu │ ├── 64_256_1024.cu │ ├── 64_256_12288.cu │ ├── 64_256_128.cu │ ├── 64_256_16384.cu │ ├── 64_256_2048.cu │ ├── 64_256_256.cu │ ├── 64_256_4096.cu │ ├── 64_256_512.cu │ ├── 64_256_64.cu │ ├── 64_256_8192.cu │ ├── 64_4096_1024.cu │ ├── 64_4096_12288.cu │ ├── 64_4096_128.cu │ ├── 64_4096_16384.cu │ ├── 64_4096_2048.cu │ ├── 64_4096_256.cu │ ├── 64_4096_4096.cu │ ├── 64_4096_512.cu │ ├── 64_4096_64.cu │ ├── 64_4096_8192.cu │ ├── 64_512_1024.cu │ ├── 64_512_12288.cu │ ├── 64_512_128.cu │ ├── 64_512_16384.cu │ ├── 64_512_2048.cu │ ├── 64_512_256.cu │ ├── 64_512_4096.cu │ ├── 64_512_512.cu │ ├── 64_512_64.cu │ ├── 64_512_8192.cu │ ├── 64_64_1024.cu │ ├── 64_64_12288.cu │ ├── 64_64_128.cu │ ├── 64_64_16384.cu │ ├── 64_64_2048.cu │ ├── 64_64_256.cu │ ├── 64_64_4096.cu │ ├── 64_64_512.cu │ ├── 64_64_64.cu │ ├── 64_64_8192.cu │ ├── 64_8192_1024.cu │ ├── 64_8192_12288.cu │ ├── 64_8192_128.cu │ ├── 64_8192_16384.cu │ ├── 64_8192_2048.cu │ ├── 64_8192_256.cu │ ├── 64_8192_4096.cu │ ├── 64_8192_512.cu │ ├── 64_8192_64.cu │ ├── 64_8192_8192.cu │ ├── 8192_1024_1024.cu │ ├── 8192_1024_12288.cu │ ├── 8192_1024_128.cu │ ├── 8192_1024_16384.cu │ ├── 8192_1024_2048.cu │ ├── 8192_1024_256.cu │ ├── 8192_1024_4096.cu │ ├── 8192_1024_512.cu │ ├── 8192_1024_64.cu │ ├── 8192_1024_8192.cu │ ├── 8192_12288_1024.cu │ ├── 8192_12288_12288.cu │ ├── 8192_12288_128.cu │ ├── 8192_12288_16384.cu │ ├── 8192_12288_2048.cu │ ├── 8192_12288_256.cu │ ├── 8192_12288_4096.cu │ ├── 8192_12288_512.cu │ ├── 8192_12288_64.cu │ ├── 8192_12288_8192.cu │ ├── 8192_128_1024.cu │ ├── 8192_128_12288.cu │ ├── 8192_128_128.cu │ ├── 8192_128_16384.cu │ ├── 8192_128_2048.cu │ ├── 8192_128_256.cu │ ├── 8192_128_4096.cu │ ├── 8192_128_512.cu │ ├── 8192_128_64.cu │ ├── 8192_128_8192.cu │ ├── 8192_16384_1024.cu │ ├── 8192_16384_12288.cu │ ├── 8192_16384_128.cu │ ├── 8192_16384_16384.cu │ ├── 8192_16384_2048.cu │ ├── 8192_16384_256.cu │ ├── 8192_16384_4096.cu │ ├── 8192_16384_512.cu │ ├── 8192_16384_64.cu │ ├── 8192_16384_8192.cu │ ├── 8192_2048_1024.cu │ ├── 8192_2048_12288.cu │ ├── 8192_2048_128.cu │ ├── 8192_2048_16384.cu │ ├── 8192_2048_2048.cu │ ├── 8192_2048_256.cu │ ├── 8192_2048_4096.cu │ ├── 8192_2048_512.cu │ ├── 8192_2048_64.cu │ ├── 8192_2048_8192.cu │ ├── 8192_256_1024.cu │ ├── 8192_256_12288.cu │ ├── 8192_256_128.cu │ ├── 8192_256_16384.cu │ ├── 8192_256_2048.cu │ ├── 8192_256_256.cu │ ├── 8192_256_4096.cu │ ├── 8192_256_512.cu │ ├── 8192_256_64.cu │ ├── 8192_256_8192.cu │ ├── 8192_4096_1024.cu │ ├── 8192_4096_12288.cu │ ├── 8192_4096_128.cu │ ├── 8192_4096_16384.cu │ ├── 8192_4096_2048.cu │ ├── 8192_4096_256.cu │ ├── 8192_4096_4096.cu │ ├── 8192_4096_512.cu │ ├── 8192_4096_64.cu │ ├── 8192_4096_8192.cu │ ├── 8192_512_1024.cu │ ├── 8192_512_12288.cu │ ├── 8192_512_128.cu │ ├── 8192_512_16384.cu │ ├── 8192_512_2048.cu │ ├── 8192_512_256.cu │ ├── 8192_512_4096.cu │ ├── 8192_512_512.cu │ ├── 8192_512_64.cu │ ├── 8192_512_8192.cu │ ├── 8192_64_1024.cu │ ├── 8192_64_12288.cu │ ├── 8192_64_128.cu │ ├── 8192_64_16384.cu │ ├── 8192_64_2048.cu │ ├── 8192_64_256.cu │ ├── 8192_64_4096.cu │ ├── 8192_64_512.cu │ ├── 8192_64_64.cu │ ├── 8192_64_8192.cu │ ├── 8192_8192_1024.cu │ ├── 8192_8192_12288.cu │ ├── 8192_8192_128.cu │ ├── 8192_8192_16384.cu │ ├── 8192_8192_2048.cu │ ├── 8192_8192_256.cu │ ├── 8192_8192_4096.cu │ ├── 8192_8192_512.cu │ ├── 8192_8192_64.cu │ └── 8192_8192_8192.cu ├── pybind └── hgemm.cc ├── randn_correctness_check.py ├── summarize_result.py ├── tools └── utils.py └── zero_one_correctness_check.py /.gitignore: -------------------------------------------------------------------------------- 1 | kernels/final_eval.json 2 | *.pyc 3 | results -------------------------------------------------------------------------------- /.vscode/settings.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/.vscode/settings.json -------------------------------------------------------------------------------- /LICENSE.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/LICENSE.txt -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/README.md -------------------------------------------------------------------------------- /assets/benchmark_comparison.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/assets/benchmark_comparison.png -------------------------------------------------------------------------------- /assets/header.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/assets/header.png -------------------------------------------------------------------------------- /assets/table.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/assets/table.png -------------------------------------------------------------------------------- /benchmarking_offline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/benchmarking_offline.py -------------------------------------------------------------------------------- /benchmarking_server.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/benchmarking_server.py -------------------------------------------------------------------------------- /benchmarking_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/benchmarking_utils.py -------------------------------------------------------------------------------- /compile.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/compile.py -------------------------------------------------------------------------------- /cublas/hgemm_cublas.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/cublas/hgemm_cublas.cu -------------------------------------------------------------------------------- /cublas/hgemm_cublaslt_auto_tuning.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/cublas/hgemm_cublaslt_auto_tuning.cu -------------------------------------------------------------------------------- /cublas/hgemm_cublaslt_heuristic.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/cublas/hgemm_cublaslt_heuristic.cu -------------------------------------------------------------------------------- /eval_one_file.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/eval_one_file.sh -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_1024_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_1024_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_1024_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_1024_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_1024_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_1024_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_1024_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_1024_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_1024_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_1024_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_1024_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_1024_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_1024_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_1024_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_1024_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_1024_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_1024_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_1024_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_1024_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_1024_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_12288_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_12288_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_12288_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_12288_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_12288_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_12288_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_12288_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_12288_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_12288_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_12288_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_12288_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_12288_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_12288_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_12288_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_12288_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_12288_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_128_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_128_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_128_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_128_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_128_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_128_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_128_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_128_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_128_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_128_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_128_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_128_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_128_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_128_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_128_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_128_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_128_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_128_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_128_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_128_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_16384_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_16384_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_16384_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_16384_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_16384_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_16384_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_16384_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_16384_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_16384_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_16384_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_16384_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_16384_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_16384_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_16384_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_16384_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_16384_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_2048_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_2048_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_2048_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_2048_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_2048_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_2048_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_2048_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_2048_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_2048_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_2048_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_2048_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_2048_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_2048_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_2048_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_2048_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_2048_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_2048_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_2048_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_2048_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_2048_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_256_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_256_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_256_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_256_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_256_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_256_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_256_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_256_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_256_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_256_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_256_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_256_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_256_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_256_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_256_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_256_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_256_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_256_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_256_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_256_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_4096_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_4096_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_4096_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_4096_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_4096_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_4096_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_4096_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_4096_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_4096_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_4096_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_4096_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_4096_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_4096_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_4096_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_4096_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_4096_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_4096_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_4096_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_4096_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_4096_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_512_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_512_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_512_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_512_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_512_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_512_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_512_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_512_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_512_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_512_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_512_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_512_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_512_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_512_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_512_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_512_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_512_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_512_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_512_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_512_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_64_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_64_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_64_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_64_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_64_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_64_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_64_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_64_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_64_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_64_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_64_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_64_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_64_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_64_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_64_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_64_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_64_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_64_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_64_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_64_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_8192_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_8192_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_8192_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_8192_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_8192_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_8192_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_8192_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_8192_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_8192_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_8192_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_8192_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_8192_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_8192_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_8192_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_8192_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_8192_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_8192_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_8192_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/1024_8192_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/1024_8192_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_1024_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_1024_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_1024_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_1024_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_1024_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_1024_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_1024_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_1024_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_1024_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_1024_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_1024_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_1024_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_1024_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_1024_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_1024_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_1024_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_12288_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_12288_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_12288_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_12288_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_12288_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_12288_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_12288_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_12288_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_128_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_128_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_128_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_128_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_128_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_128_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_128_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_128_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_128_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_128_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_128_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_128_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_128_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_128_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_128_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_128_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_128_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_128_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_128_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_128_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_16384_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_16384_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_16384_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_16384_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_16384_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_16384_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_16384_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_16384_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_2048_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_2048_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_2048_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_2048_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_2048_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_2048_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_2048_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_2048_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_2048_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_2048_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_2048_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_2048_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_2048_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_2048_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_2048_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_2048_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_256_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_256_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_256_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_256_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_256_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_256_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_256_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_256_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_256_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_256_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_256_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_256_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_256_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_256_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_256_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_256_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_256_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_256_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_256_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_256_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_4096_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_4096_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_4096_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_4096_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_4096_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_4096_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_4096_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_4096_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_4096_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_4096_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_4096_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_4096_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_4096_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_4096_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_4096_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_4096_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_512_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_512_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_512_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_512_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_512_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_512_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_512_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_512_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_512_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_512_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_512_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_512_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_512_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_512_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_512_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_512_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_512_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_512_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_512_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_512_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_64_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_64_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_64_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_64_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_64_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_64_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_64_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_64_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_64_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_64_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_64_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_64_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_64_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_64_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_64_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_64_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_64_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_64_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_64_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_64_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_8192_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_8192_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_8192_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_8192_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_8192_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_8192_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_8192_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_8192_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_8192_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_8192_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_8192_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_8192_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_8192_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_8192_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/12288_8192_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/12288_8192_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_1024_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_1024_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_1024_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_1024_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_1024_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_1024_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_1024_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_1024_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_1024_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_1024_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_1024_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_1024_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_1024_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_1024_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_1024_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_1024_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_1024_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_1024_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_1024_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_1024_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_12288_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_12288_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_12288_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_12288_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_12288_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_12288_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_12288_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_12288_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_12288_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_12288_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_12288_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_12288_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_12288_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_12288_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_12288_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_12288_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_12288_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_12288_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_12288_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_12288_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_128_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_128_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_128_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_128_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_128_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_128_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_128_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_128_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_128_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_128_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_128_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_128_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_128_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_128_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_128_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_128_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_128_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_128_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_128_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_128_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_16384_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_16384_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_16384_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_16384_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_16384_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_16384_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_16384_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_16384_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_16384_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_16384_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_16384_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_16384_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_16384_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_16384_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_16384_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_16384_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_16384_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_16384_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_16384_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_16384_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_2048_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_2048_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_2048_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_2048_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_2048_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_2048_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_2048_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_2048_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_2048_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_2048_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_2048_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_2048_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_2048_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_2048_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_2048_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_2048_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_2048_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_2048_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_2048_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_2048_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_256_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_256_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_256_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_256_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_256_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_256_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_256_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_256_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_256_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_256_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_256_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_256_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_256_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_256_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_256_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_256_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_256_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_256_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_256_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_256_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_4096_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_4096_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_4096_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_4096_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_4096_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_4096_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_4096_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_4096_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_4096_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_4096_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_4096_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_4096_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_4096_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_4096_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_4096_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_4096_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_4096_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_4096_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_4096_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_4096_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_512_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_512_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_512_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_512_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_512_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_512_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_512_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_512_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_512_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_512_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_512_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_512_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_512_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_512_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_512_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_512_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_512_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_512_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_512_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_512_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_64_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_64_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_64_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_64_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_64_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_64_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_64_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_64_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_64_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_64_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_64_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_64_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_64_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_64_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_64_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_64_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_64_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_64_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_64_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_64_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_8192_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_8192_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_8192_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_8192_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_8192_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_8192_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_8192_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_8192_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_8192_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_8192_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_8192_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_8192_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_8192_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_8192_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_8192_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_8192_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_8192_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_8192_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/128_8192_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/128_8192_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_1024_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_1024_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_1024_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_1024_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_1024_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_1024_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_1024_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_1024_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_1024_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_1024_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_1024_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_1024_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_1024_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_1024_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_1024_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_1024_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_12288_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_12288_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_12288_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_12288_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_12288_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_12288_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_12288_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_12288_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_128_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_128_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_128_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_128_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_128_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_128_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_128_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_128_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_128_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_128_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_128_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_128_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_128_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_128_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_128_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_128_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_128_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_128_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_128_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_128_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_16384_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_16384_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_16384_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_16384_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_16384_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_16384_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_16384_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_16384_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_2048_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_2048_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_2048_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_2048_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_2048_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_2048_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_2048_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_2048_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_2048_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_2048_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_2048_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_2048_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_2048_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_2048_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_2048_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_2048_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_256_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_256_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_256_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_256_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_256_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_256_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_256_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_256_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_256_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_256_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_256_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_256_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_256_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_256_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_256_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_256_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_256_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_256_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_256_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_256_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_4096_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_4096_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_4096_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_4096_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_4096_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_4096_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_4096_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_4096_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_4096_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_4096_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_4096_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_4096_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_4096_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_4096_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_4096_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_4096_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_512_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_512_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_512_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_512_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_512_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_512_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_512_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_512_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_512_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_512_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_512_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_512_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_512_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_512_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_512_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_512_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_512_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_512_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_512_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_512_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_64_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_64_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_64_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_64_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_64_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_64_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_64_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_64_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_64_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_64_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_64_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_64_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_64_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_64_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_64_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_64_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_64_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_64_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_64_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_64_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_8192_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_8192_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_8192_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_8192_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_8192_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_8192_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_8192_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_8192_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_8192_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_8192_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_8192_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_8192_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_8192_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_8192_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/16384_8192_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/16384_8192_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_1024_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_1024_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_1024_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_1024_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_1024_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_1024_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_1024_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_1024_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_1024_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_1024_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_1024_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_1024_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_1024_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_1024_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_1024_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_1024_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_1024_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_1024_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_1024_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_1024_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_12288_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_12288_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_12288_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_12288_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_12288_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_12288_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_12288_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_12288_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_12288_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_12288_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_12288_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_12288_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_12288_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_12288_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_12288_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_12288_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_128_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_128_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_128_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_128_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_128_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_128_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_128_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_128_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_128_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_128_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_128_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_128_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_128_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_128_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_128_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_128_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_128_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_128_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_128_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_128_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_16384_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_16384_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_16384_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_16384_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_16384_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_16384_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_16384_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_16384_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_16384_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_16384_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_16384_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_16384_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_16384_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_16384_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_16384_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_16384_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_2048_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_2048_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_2048_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_2048_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_2048_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_2048_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_2048_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_2048_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_2048_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_2048_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_2048_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_2048_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_2048_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_2048_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_2048_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_2048_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_2048_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_2048_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_2048_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_2048_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_256_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_256_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_256_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_256_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_256_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_256_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_256_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_256_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_256_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_256_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_256_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_256_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_256_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_256_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_256_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_256_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_256_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_256_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_256_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_256_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_4096_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_4096_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_4096_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_4096_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_4096_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_4096_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_4096_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_4096_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_4096_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_4096_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_4096_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_4096_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_4096_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_4096_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_4096_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_4096_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_4096_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_4096_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_4096_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_4096_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_512_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_512_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_512_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_512_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_512_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_512_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_512_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_512_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_512_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_512_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_512_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_512_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_512_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_512_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_512_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_512_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_512_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_512_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_512_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_512_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_64_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_64_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_64_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_64_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_64_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_64_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_64_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_64_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_64_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_64_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_64_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_64_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_64_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_64_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_64_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_64_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_64_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_64_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_64_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_64_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_8192_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_8192_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_8192_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_8192_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_8192_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_8192_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_8192_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_8192_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_8192_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_8192_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_8192_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_8192_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_8192_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_8192_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_8192_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_8192_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_8192_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_8192_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/2048_8192_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/2048_8192_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_1024_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_1024_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_1024_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_1024_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_1024_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_1024_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_1024_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_1024_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_1024_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_1024_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_1024_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_1024_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_1024_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_1024_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_1024_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_1024_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_1024_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_1024_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_1024_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_1024_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_12288_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_12288_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_12288_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_12288_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_12288_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_12288_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_12288_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_12288_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_12288_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_12288_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_12288_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_12288_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_12288_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_12288_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_12288_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_12288_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_12288_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_12288_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_12288_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_12288_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_128_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_128_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_128_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_128_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_128_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_128_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_128_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_128_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_128_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_128_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_128_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_128_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_128_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_128_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_128_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_128_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_128_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_128_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_128_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_128_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_16384_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_16384_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_16384_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_16384_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_16384_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_16384_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_16384_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_16384_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_16384_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_16384_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_16384_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_16384_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_16384_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_16384_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_16384_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_16384_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_16384_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_16384_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_16384_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_16384_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_2048_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_2048_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_2048_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_2048_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_2048_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_2048_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_2048_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_2048_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_2048_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_2048_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_2048_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_2048_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_2048_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_2048_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_2048_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_2048_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_2048_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_2048_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_2048_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_2048_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_256_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_256_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_256_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_256_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_256_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_256_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_256_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_256_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_256_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_256_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_256_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_256_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_256_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_256_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_256_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_256_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_256_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_256_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_256_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_256_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_4096_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_4096_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_4096_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_4096_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_4096_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_4096_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_4096_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_4096_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_4096_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_4096_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_4096_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_4096_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_4096_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_4096_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_4096_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_4096_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_4096_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_4096_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_4096_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_4096_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_512_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_512_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_512_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_512_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_512_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_512_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_512_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_512_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_512_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_512_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_512_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_512_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_512_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_512_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_512_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_512_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_512_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_512_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_512_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_512_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_64_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_64_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_64_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_64_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_64_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_64_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_64_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_64_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_64_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_64_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_64_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_64_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_64_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_64_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_64_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_64_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_64_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_64_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_64_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_64_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_8192_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_8192_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_8192_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_8192_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_8192_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_8192_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_8192_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_8192_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_8192_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_8192_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_8192_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_8192_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_8192_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_8192_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_8192_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_8192_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_8192_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_8192_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/256_8192_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/256_8192_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_1024_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_1024_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_1024_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_1024_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_1024_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_1024_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_1024_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_1024_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_1024_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_1024_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_1024_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_1024_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_1024_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_1024_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_1024_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_1024_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_1024_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_1024_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_1024_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_1024_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_12288_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_12288_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_12288_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_12288_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_12288_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_12288_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_12288_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_12288_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_12288_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_12288_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_12288_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_12288_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_12288_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_12288_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_12288_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_12288_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_128_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_128_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_128_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_128_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_128_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_128_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_128_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_128_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_128_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_128_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_128_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_128_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_128_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_128_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_128_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_128_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_128_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_128_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_128_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_128_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_16384_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_16384_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_16384_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_16384_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_16384_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_16384_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_16384_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_16384_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_16384_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_16384_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_16384_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_16384_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_16384_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_16384_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_16384_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_16384_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_2048_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_2048_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_2048_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_2048_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_2048_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_2048_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_2048_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_2048_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_2048_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_2048_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_2048_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_2048_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_2048_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_2048_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_2048_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_2048_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_256_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_256_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_256_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_256_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_256_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_256_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_256_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_256_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_4096_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_4096_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_512_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_512_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_512_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_512_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_512_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_512_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_512_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_512_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_64_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_64_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_64_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_64_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_64_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_64_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_64_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_64_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_64_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_64_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_64_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_64_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_64_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_64_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_64_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_64_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/4096_8192_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/4096_8192_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_1024_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_1024_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_1024_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_1024_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_1024_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_1024_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_1024_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_1024_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_12288_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_12288_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_128_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_128_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_128_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_128_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_128_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_128_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_128_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_128_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_128_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_128_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_128_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_128_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_128_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_128_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_128_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_128_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_16384_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_16384_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_2048_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_2048_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_2048_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_2048_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_2048_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_2048_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_2048_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_2048_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_256_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_256_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_256_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_256_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_256_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_256_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_256_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_256_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_256_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_256_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_256_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_256_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_256_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_256_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_256_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_256_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_4096_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_4096_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_4096_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_4096_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_4096_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_4096_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_4096_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_4096_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_512_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_512_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_512_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_512_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_512_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_512_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_512_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_512_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_512_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_512_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_512_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_512_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_512_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_512_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_512_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_512_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_64_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_64_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_64_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_64_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_64_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_64_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_64_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_64_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_64_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_64_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_64_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_64_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_64_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_64_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_64_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_64_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_64_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_64_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_64_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_64_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_8192_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_8192_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_8192_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_8192_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_8192_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_8192_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/512_8192_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/512_8192_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_1024_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_1024_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_1024_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_1024_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_1024_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_1024_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_1024_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_1024_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_1024_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_1024_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_1024_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_1024_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_1024_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_1024_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_1024_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_1024_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_12288_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_12288_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_12288_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_12288_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_12288_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_12288_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_12288_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_12288_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_128_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_128_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_128_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_128_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_128_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_128_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_128_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_128_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_128_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_128_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_128_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_128_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_128_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_128_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_128_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_128_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_128_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_128_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_128_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_128_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_16384_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_16384_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_16384_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_16384_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_16384_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_16384_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_16384_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_16384_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_2048_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_2048_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_2048_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_2048_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_2048_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_2048_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_2048_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_2048_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_2048_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_2048_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_2048_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_2048_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_2048_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_2048_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_2048_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_2048_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_256_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_256_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_256_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_256_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_256_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_256_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_256_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_256_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_256_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_256_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_256_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_256_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_256_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_256_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_256_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_256_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_256_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_256_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_256_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_256_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_4096_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_4096_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_4096_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_4096_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_4096_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_4096_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_4096_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_4096_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_4096_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_4096_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_4096_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_4096_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_4096_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_4096_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_4096_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_4096_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_512_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_512_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_512_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_512_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_512_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_512_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_512_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_512_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_512_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_512_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_512_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_512_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_512_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_512_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_512_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_512_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_512_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_512_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_512_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_512_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_64_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_64_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_64_12288.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_64_12288.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_64_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_64_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_64_16384.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_64_16384.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_64_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_64_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_64_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_64_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_64_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_64_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_64_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_64_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_64_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_64_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_64_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_64_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_8192_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_8192_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_8192_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_8192_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_8192_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_8192_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_8192_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_8192_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_8192_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_8192_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_8192_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_8192_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_8192_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_8192_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/64_8192_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/64_8192_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_1024_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_1024_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_128_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_128_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_128_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_128_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_128_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_128_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_128_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_128_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_2048_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_2048_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_256_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_256_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_256_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_256_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_256_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_256_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_256_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_256_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_4096_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_4096_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_512_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_512_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_512_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_512_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_512_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_512_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_512_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_512_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_64_1024.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_64_1024.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_64_128.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_64_128.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_64_2048.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_64_2048.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_64_256.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_64_256.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_64_4096.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_64_4096.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_64_512.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_64_512.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_64_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_64_64.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_64_8192.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_64_8192.cu -------------------------------------------------------------------------------- /kernels/a100_F16F16F16F16/8192_8192_64.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/kernels/a100_F16F16F16F16/8192_8192_64.cu -------------------------------------------------------------------------------- /pybind/hgemm.cc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/pybind/hgemm.cc -------------------------------------------------------------------------------- /randn_correctness_check.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/randn_correctness_check.py -------------------------------------------------------------------------------- /summarize_result.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/summarize_result.py -------------------------------------------------------------------------------- /tools/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/tools/utils.py -------------------------------------------------------------------------------- /zero_one_correctness_check.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/deepreinforce-ai/CUDA-L2/HEAD/zero_one_correctness_check.py --------------------------------------------------------------------------------