├── .github ├── ISSUE_TEMPLATE │ ├── bug_report.md │ ├── config.yml │ ├── documentation-request.md │ └── feature_request.md └── PULL_REQUEST_TEMPLATE.md ├── .gitignore ├── APPENDIX.md ├── CHANGELOG ├── CLA.md ├── CODE_OF_CONDUCT.md ├── LICENSE ├── README.md ├── SECURITY.md ├── alternative_recipes └── helm-charts │ └── inference │ └── llm-benchmarks │ ├── .gitignore │ ├── README.md │ ├── llm-benchmark-chart │ ├── .helmignore │ ├── Chart.yaml │ ├── example-vllm-benchmark_output.txt │ ├── templates │ │ ├── _helpers.tpl │ │ ├── client │ │ │ ├── job.yaml │ │ │ └── serviceaccount.yaml │ │ ├── configmap-metrics.yaml │ │ └── server │ │ │ ├── deployment.yaml │ │ │ └── service.yaml │ └── values.yaml │ ├── sg-llm-server-values.yaml │ ├── vllm-embedding-server-values.yaml │ ├── vllm-llm-server-values.yaml │ └── vllm-server-values.yaml ├── cli ├── llmb-install │ ├── CHANGELOG.md │ ├── README.md │ ├── docs │ │ ├── headless-installation.md │ │ ├── recipe_guide.md │ │ └── tools.md │ ├── example_config.yaml │ ├── pyproject.toml │ └── src │ │ └── llmb_install │ │ ├── __init__.py │ │ ├── __main__.py │ │ ├── cli.py │ │ ├── cluster │ │ ├── __init__.py │ │ ├── gpu.py │ │ └── slurm.py │ │ ├── config │ │ ├── __init__.py │ │ ├── cluster.py │ │ ├── headless.py │ │ ├── models.py │ │ └── system.py │ │ ├── constants.py │ │ ├── container │ │ ├── __init__.py │ │ └── image.py │ │ ├── core │ │ ├── __init__.py │ │ ├── dependency.py │ │ ├── installer.py │ │ ├── tools.py │ │ └── workload.py │ │ ├── environment │ │ ├── __init__.py │ │ ├── cache.py │ │ ├── detector.py │ │ ├── venv_manager.py │ │ └── venv_utils.py │ │ ├── ui │ │ ├── __init__.py │ │ ├── interface.py │ │ ├── prompts │ │ │ ├── __init__.py │ │ │ ├── environment.py │ │ │ ├── gpu.py │ │ │ ├── installation.py │ │ │ ├── slurm.py │ │ │ └── workload.py │ │ ├── rich_ui.py │ │ └── simple.py │ │ └── utils │ │ ├── __init__.py │ │ ├── filesystem.py │ │ ├── git.py │ │ └── logging.py └── llmb-run │ ├── Bulk_Examples.md │ ├── CHANGELOG.md │ ├── README.md │ ├── cluster_config.yaml │ ├── example_llmb_config.yaml │ ├── llmb-run │ ├── pyproject.toml │ └── src │ └── llmb_run │ ├── __init__.py │ ├── config_manager.py │ ├── constants.py │ ├── job_launcher.py │ ├── main.py │ ├── metadata_utils.py │ ├── nsys_mount_handler.py │ ├── run_config.py │ ├── slurm_utils.py │ ├── task_manager.py │ └── workload_validator.py ├── common ├── parse_train_timing.sh └── parse_train_timing_mbridge.sh ├── deepseek_r1 └── inference │ ├── dynamo │ ├── README.md │ ├── download_weights.sh │ ├── launch.sh │ ├── metadata.yaml │ └── scripts │ │ ├── bench.sh │ │ ├── gen_yaml.py │ │ ├── postprocess_results.py │ │ ├── set_clock.sh │ │ ├── start_disagg_worker.sh │ │ └── start_frontend.sh │ ├── sglang │ ├── README.md │ ├── download_weights.sh │ ├── launch.sh │ ├── launch_server.sh │ └── metadata.yaml │ └── trtllm │ ├── README.md │ ├── download_weights.sh │ ├── launch.sh │ └── metadata.yaml ├── deepseek_v3 └── pretrain │ ├── README.md │ ├── launch.sh │ └── metadata.yaml ├── gpt-oss └── inference │ ├── README.md │ ├── bench.yaml │ ├── config.yaml │ ├── deploy.yaml │ ├── frontend-service.yaml │ ├── model_cache │ └── model-download.yaml │ └── service.yaml ├── grok1 ├── README.md ├── launch.sh └── metadata.yaml ├── install.sh ├── llama3.1 ├── README.md ├── launch.sh └── metadata.yaml ├── llama3.3 └── inference │ ├── README.md │ ├── download_weights.sh │ ├── launch.sh │ └── metadata.yaml ├── llama3 └── finetune │ ├── README.md │ ├── download_ckpt_dataset.sh │ ├── launch.sh │ └── metadata.yaml ├── microbenchmarks └── cpu_overhead │ ├── README.md │ ├── download_dataset.sh │ ├── launch.sh │ ├── metadata.yaml │ └── pytorch_kernel_launch_latency.py ├── nccl ├── README.md ├── config │ ├── nemofw.user.toml │ ├── systems.toml │ └── testset.toml ├── metadata.yaml └── setup_nccl_launcher.sh ├── nemotron-h ├── README.md ├── launch.sh └── metadata.yaml ├── nemotron4-15b ├── README.md ├── launch.sh ├── metadata.yaml └── setup.sh ├── nemotron4-340b ├── README.md ├── launch.sh ├── metadata.yaml └── setup.sh ├── print_env.sh └── release.yaml /.github/ISSUE_TEMPLATE/bug_report.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/.github/ISSUE_TEMPLATE/bug_report.md -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/config.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/.github/ISSUE_TEMPLATE/config.yml -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/documentation-request.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/.github/ISSUE_TEMPLATE/documentation-request.md -------------------------------------------------------------------------------- /.github/ISSUE_TEMPLATE/feature_request.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/.github/ISSUE_TEMPLATE/feature_request.md -------------------------------------------------------------------------------- /.github/PULL_REQUEST_TEMPLATE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/.github/PULL_REQUEST_TEMPLATE.md -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/.gitignore -------------------------------------------------------------------------------- /APPENDIX.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/APPENDIX.md -------------------------------------------------------------------------------- /CHANGELOG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/CHANGELOG -------------------------------------------------------------------------------- /CLA.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/CLA.md -------------------------------------------------------------------------------- /CODE_OF_CONDUCT.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/CODE_OF_CONDUCT.md -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/README.md -------------------------------------------------------------------------------- /SECURITY.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/SECURITY.md -------------------------------------------------------------------------------- /alternative_recipes/helm-charts/inference/llm-benchmarks/.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/alternative_recipes/helm-charts/inference/llm-benchmarks/.gitignore -------------------------------------------------------------------------------- /alternative_recipes/helm-charts/inference/llm-benchmarks/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/alternative_recipes/helm-charts/inference/llm-benchmarks/README.md -------------------------------------------------------------------------------- /alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/.helmignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/.helmignore -------------------------------------------------------------------------------- /alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/Chart.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/Chart.yaml -------------------------------------------------------------------------------- /alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/example-vllm-benchmark_output.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/example-vllm-benchmark_output.txt -------------------------------------------------------------------------------- /alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/templates/_helpers.tpl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/templates/_helpers.tpl -------------------------------------------------------------------------------- /alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/templates/client/job.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/templates/client/job.yaml -------------------------------------------------------------------------------- /alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/templates/client/serviceaccount.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/templates/client/serviceaccount.yaml -------------------------------------------------------------------------------- /alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/templates/configmap-metrics.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/templates/configmap-metrics.yaml -------------------------------------------------------------------------------- /alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/templates/server/deployment.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/templates/server/deployment.yaml -------------------------------------------------------------------------------- /alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/templates/server/service.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/templates/server/service.yaml -------------------------------------------------------------------------------- /alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/values.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/alternative_recipes/helm-charts/inference/llm-benchmarks/llm-benchmark-chart/values.yaml -------------------------------------------------------------------------------- /alternative_recipes/helm-charts/inference/llm-benchmarks/sg-llm-server-values.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/alternative_recipes/helm-charts/inference/llm-benchmarks/sg-llm-server-values.yaml -------------------------------------------------------------------------------- /alternative_recipes/helm-charts/inference/llm-benchmarks/vllm-embedding-server-values.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/alternative_recipes/helm-charts/inference/llm-benchmarks/vllm-embedding-server-values.yaml -------------------------------------------------------------------------------- /alternative_recipes/helm-charts/inference/llm-benchmarks/vllm-llm-server-values.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/alternative_recipes/helm-charts/inference/llm-benchmarks/vllm-llm-server-values.yaml -------------------------------------------------------------------------------- /alternative_recipes/helm-charts/inference/llm-benchmarks/vllm-server-values.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/alternative_recipes/helm-charts/inference/llm-benchmarks/vllm-server-values.yaml -------------------------------------------------------------------------------- /cli/llmb-install/CHANGELOG.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/CHANGELOG.md -------------------------------------------------------------------------------- /cli/llmb-install/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/README.md -------------------------------------------------------------------------------- /cli/llmb-install/docs/headless-installation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/docs/headless-installation.md -------------------------------------------------------------------------------- /cli/llmb-install/docs/recipe_guide.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/docs/recipe_guide.md -------------------------------------------------------------------------------- /cli/llmb-install/docs/tools.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/docs/tools.md -------------------------------------------------------------------------------- /cli/llmb-install/example_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/example_config.yaml -------------------------------------------------------------------------------- /cli/llmb-install/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/pyproject.toml -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/__init__.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/__main__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/__main__.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/cli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/cli.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/cluster/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/cluster/__init__.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/cluster/gpu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/cluster/gpu.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/cluster/slurm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/cluster/slurm.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/config/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/config/__init__.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/config/cluster.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/config/cluster.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/config/headless.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/config/headless.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/config/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/config/models.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/config/system.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/config/system.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/constants.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/container/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/container/__init__.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/container/image.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/container/image.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/core/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/core/__init__.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/core/dependency.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/core/dependency.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/core/installer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/core/installer.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/core/tools.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/core/tools.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/core/workload.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/core/workload.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/environment/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/environment/__init__.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/environment/cache.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/environment/cache.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/environment/detector.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/environment/detector.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/environment/venv_manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/environment/venv_manager.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/environment/venv_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/environment/venv_utils.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/ui/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/ui/__init__.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/ui/interface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/ui/interface.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/ui/prompts/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/ui/prompts/__init__.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/ui/prompts/environment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/ui/prompts/environment.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/ui/prompts/gpu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/ui/prompts/gpu.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/ui/prompts/installation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/ui/prompts/installation.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/ui/prompts/slurm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/ui/prompts/slurm.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/ui/prompts/workload.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/ui/prompts/workload.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/ui/rich_ui.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/ui/rich_ui.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/ui/simple.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/ui/simple.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/utils/__init__.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/utils/filesystem.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/utils/filesystem.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/utils/git.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/utils/git.py -------------------------------------------------------------------------------- /cli/llmb-install/src/llmb_install/utils/logging.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-install/src/llmb_install/utils/logging.py -------------------------------------------------------------------------------- /cli/llmb-run/Bulk_Examples.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/Bulk_Examples.md -------------------------------------------------------------------------------- /cli/llmb-run/CHANGELOG.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/CHANGELOG.md -------------------------------------------------------------------------------- /cli/llmb-run/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/README.md -------------------------------------------------------------------------------- /cli/llmb-run/cluster_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/cluster_config.yaml -------------------------------------------------------------------------------- /cli/llmb-run/example_llmb_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/example_llmb_config.yaml -------------------------------------------------------------------------------- /cli/llmb-run/llmb-run: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/llmb-run -------------------------------------------------------------------------------- /cli/llmb-run/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/pyproject.toml -------------------------------------------------------------------------------- /cli/llmb-run/src/llmb_run/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/src/llmb_run/__init__.py -------------------------------------------------------------------------------- /cli/llmb-run/src/llmb_run/config_manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/src/llmb_run/config_manager.py -------------------------------------------------------------------------------- /cli/llmb-run/src/llmb_run/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/src/llmb_run/constants.py -------------------------------------------------------------------------------- /cli/llmb-run/src/llmb_run/job_launcher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/src/llmb_run/job_launcher.py -------------------------------------------------------------------------------- /cli/llmb-run/src/llmb_run/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/src/llmb_run/main.py -------------------------------------------------------------------------------- /cli/llmb-run/src/llmb_run/metadata_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/src/llmb_run/metadata_utils.py -------------------------------------------------------------------------------- /cli/llmb-run/src/llmb_run/nsys_mount_handler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/src/llmb_run/nsys_mount_handler.py -------------------------------------------------------------------------------- /cli/llmb-run/src/llmb_run/run_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/src/llmb_run/run_config.py -------------------------------------------------------------------------------- /cli/llmb-run/src/llmb_run/slurm_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/src/llmb_run/slurm_utils.py -------------------------------------------------------------------------------- /cli/llmb-run/src/llmb_run/task_manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/src/llmb_run/task_manager.py -------------------------------------------------------------------------------- /cli/llmb-run/src/llmb_run/workload_validator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/cli/llmb-run/src/llmb_run/workload_validator.py -------------------------------------------------------------------------------- /common/parse_train_timing.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/common/parse_train_timing.sh -------------------------------------------------------------------------------- /common/parse_train_timing_mbridge.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/common/parse_train_timing_mbridge.sh -------------------------------------------------------------------------------- /deepseek_r1/inference/dynamo/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/dynamo/README.md -------------------------------------------------------------------------------- /deepseek_r1/inference/dynamo/download_weights.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/dynamo/download_weights.sh -------------------------------------------------------------------------------- /deepseek_r1/inference/dynamo/launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/dynamo/launch.sh -------------------------------------------------------------------------------- /deepseek_r1/inference/dynamo/metadata.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/dynamo/metadata.yaml -------------------------------------------------------------------------------- /deepseek_r1/inference/dynamo/scripts/bench.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/dynamo/scripts/bench.sh -------------------------------------------------------------------------------- /deepseek_r1/inference/dynamo/scripts/gen_yaml.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/dynamo/scripts/gen_yaml.py -------------------------------------------------------------------------------- /deepseek_r1/inference/dynamo/scripts/postprocess_results.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/dynamo/scripts/postprocess_results.py -------------------------------------------------------------------------------- /deepseek_r1/inference/dynamo/scripts/set_clock.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/dynamo/scripts/set_clock.sh -------------------------------------------------------------------------------- /deepseek_r1/inference/dynamo/scripts/start_disagg_worker.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/dynamo/scripts/start_disagg_worker.sh -------------------------------------------------------------------------------- /deepseek_r1/inference/dynamo/scripts/start_frontend.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/dynamo/scripts/start_frontend.sh -------------------------------------------------------------------------------- /deepseek_r1/inference/sglang/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/sglang/README.md -------------------------------------------------------------------------------- /deepseek_r1/inference/sglang/download_weights.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/sglang/download_weights.sh -------------------------------------------------------------------------------- /deepseek_r1/inference/sglang/launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/sglang/launch.sh -------------------------------------------------------------------------------- /deepseek_r1/inference/sglang/launch_server.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/sglang/launch_server.sh -------------------------------------------------------------------------------- /deepseek_r1/inference/sglang/metadata.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/sglang/metadata.yaml -------------------------------------------------------------------------------- /deepseek_r1/inference/trtllm/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/trtllm/README.md -------------------------------------------------------------------------------- /deepseek_r1/inference/trtllm/download_weights.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/trtllm/download_weights.sh -------------------------------------------------------------------------------- /deepseek_r1/inference/trtllm/launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/trtllm/launch.sh -------------------------------------------------------------------------------- /deepseek_r1/inference/trtllm/metadata.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_r1/inference/trtllm/metadata.yaml -------------------------------------------------------------------------------- /deepseek_v3/pretrain/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_v3/pretrain/README.md -------------------------------------------------------------------------------- /deepseek_v3/pretrain/launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_v3/pretrain/launch.sh -------------------------------------------------------------------------------- /deepseek_v3/pretrain/metadata.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/deepseek_v3/pretrain/metadata.yaml -------------------------------------------------------------------------------- /gpt-oss/inference/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/gpt-oss/inference/README.md -------------------------------------------------------------------------------- /gpt-oss/inference/bench.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/gpt-oss/inference/bench.yaml -------------------------------------------------------------------------------- /gpt-oss/inference/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/gpt-oss/inference/config.yaml -------------------------------------------------------------------------------- /gpt-oss/inference/deploy.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/gpt-oss/inference/deploy.yaml -------------------------------------------------------------------------------- /gpt-oss/inference/frontend-service.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/gpt-oss/inference/frontend-service.yaml -------------------------------------------------------------------------------- /gpt-oss/inference/model_cache/model-download.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/gpt-oss/inference/model_cache/model-download.yaml -------------------------------------------------------------------------------- /gpt-oss/inference/service.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/gpt-oss/inference/service.yaml -------------------------------------------------------------------------------- /grok1/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/grok1/README.md -------------------------------------------------------------------------------- /grok1/launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/grok1/launch.sh -------------------------------------------------------------------------------- /grok1/metadata.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/grok1/metadata.yaml -------------------------------------------------------------------------------- /install.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/install.sh -------------------------------------------------------------------------------- /llama3.1/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/llama3.1/README.md -------------------------------------------------------------------------------- /llama3.1/launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/llama3.1/launch.sh -------------------------------------------------------------------------------- /llama3.1/metadata.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/llama3.1/metadata.yaml -------------------------------------------------------------------------------- /llama3.3/inference/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/llama3.3/inference/README.md -------------------------------------------------------------------------------- /llama3.3/inference/download_weights.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/llama3.3/inference/download_weights.sh -------------------------------------------------------------------------------- /llama3.3/inference/launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/llama3.3/inference/launch.sh -------------------------------------------------------------------------------- /llama3.3/inference/metadata.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/llama3.3/inference/metadata.yaml -------------------------------------------------------------------------------- /llama3/finetune/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/llama3/finetune/README.md -------------------------------------------------------------------------------- /llama3/finetune/download_ckpt_dataset.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/llama3/finetune/download_ckpt_dataset.sh -------------------------------------------------------------------------------- /llama3/finetune/launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/llama3/finetune/launch.sh -------------------------------------------------------------------------------- /llama3/finetune/metadata.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/llama3/finetune/metadata.yaml -------------------------------------------------------------------------------- /microbenchmarks/cpu_overhead/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/microbenchmarks/cpu_overhead/README.md -------------------------------------------------------------------------------- /microbenchmarks/cpu_overhead/download_dataset.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/microbenchmarks/cpu_overhead/download_dataset.sh -------------------------------------------------------------------------------- /microbenchmarks/cpu_overhead/launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/microbenchmarks/cpu_overhead/launch.sh -------------------------------------------------------------------------------- /microbenchmarks/cpu_overhead/metadata.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/microbenchmarks/cpu_overhead/metadata.yaml -------------------------------------------------------------------------------- /microbenchmarks/cpu_overhead/pytorch_kernel_launch_latency.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/microbenchmarks/cpu_overhead/pytorch_kernel_launch_latency.py -------------------------------------------------------------------------------- /nccl/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/nccl/README.md -------------------------------------------------------------------------------- /nccl/config/nemofw.user.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/nccl/config/nemofw.user.toml -------------------------------------------------------------------------------- /nccl/config/systems.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/nccl/config/systems.toml -------------------------------------------------------------------------------- /nccl/config/testset.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/nccl/config/testset.toml -------------------------------------------------------------------------------- /nccl/metadata.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/nccl/metadata.yaml -------------------------------------------------------------------------------- /nccl/setup_nccl_launcher.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/nccl/setup_nccl_launcher.sh -------------------------------------------------------------------------------- /nemotron-h/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/nemotron-h/README.md -------------------------------------------------------------------------------- /nemotron-h/launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/nemotron-h/launch.sh -------------------------------------------------------------------------------- /nemotron-h/metadata.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/nemotron-h/metadata.yaml -------------------------------------------------------------------------------- /nemotron4-15b/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/nemotron4-15b/README.md -------------------------------------------------------------------------------- /nemotron4-15b/launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/nemotron4-15b/launch.sh -------------------------------------------------------------------------------- /nemotron4-15b/metadata.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/nemotron4-15b/metadata.yaml -------------------------------------------------------------------------------- /nemotron4-15b/setup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/nemotron4-15b/setup.sh -------------------------------------------------------------------------------- /nemotron4-340b/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/nemotron4-340b/README.md -------------------------------------------------------------------------------- /nemotron4-340b/launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/nemotron4-340b/launch.sh -------------------------------------------------------------------------------- /nemotron4-340b/metadata.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/nemotron4-340b/metadata.yaml -------------------------------------------------------------------------------- /nemotron4-340b/setup.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/nemotron4-340b/setup.sh -------------------------------------------------------------------------------- /print_env.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/print_env.sh -------------------------------------------------------------------------------- /release.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/NVIDIA/dgxc-benchmarking/HEAD/release.yaml --------------------------------------------------------------------------------