├── .gitignore ├── LICENSE ├── artifact_evaluation ├── ablation │ ├── ablation1_pruning.py │ ├── ablation2_initial.py │ ├── ablation3_quality.py │ ├── config │ │ ├── 3cluster24.ini │ │ ├── cluster10.ini │ │ ├── cluster42.ini │ │ └── machine_profiles.ini │ ├── heuristics │ │ ├── cluster24 │ │ │ └── swarm_sol.ini │ │ └── cluster42 │ │ │ └── swarm_sol.ini │ └── layouts │ │ ├── no_prune_24 │ │ ├── 2024-11-08_16-15-10new.ini │ │ ├── ilp_model.lp │ │ ├── ilp_sol.ini │ │ ├── ilp_solution.sol │ │ ├── simulator_cluster.ini │ │ └── trace.txt │ │ ├── no_prune_42 │ │ ├── 2024-11-08_17-04-45new.ini │ │ ├── ilp_model.lp │ │ ├── ilp_sol.ini │ │ ├── ilp_solution.sol │ │ ├── simulator_cluster.ini │ │ └── trace.txt │ │ ├── quality │ │ ├── 2024-10-26_19-46-55new.ini │ │ ├── ilp_model.lp │ │ ├── ilp_sol.ini │ │ ├── ilp_solution.sol │ │ ├── simulator_cluster.ini │ │ └── trace.txt │ │ ├── raw_24 │ │ ├── 2024-11-08_18-30-19new.ini │ │ ├── ilp_model.lp │ │ ├── ilp_sol.ini │ │ ├── ilp_solution.sol │ │ ├── pruned_cluster.ini │ │ ├── simulator_cluster.ini │ │ └── trace.txt │ │ └── raw_42 │ │ ├── 2024-11-08_20-49-18new.ini │ │ ├── ilp_model.lp │ │ ├── ilp_sol.ini │ │ ├── ilp_solution.sol │ │ ├── pruned_cluster.ini │ │ ├── simulator_cluster.ini │ │ └── trace.txt ├── ae_readme.md ├── distributed_clusters │ ├── config │ │ ├── 3cluster24.ini │ │ ├── a100.ini │ │ ├── l4.ini │ │ ├── machine_profiles.ini │ │ └── t4.ini │ ├── layout_llama30b │ │ ├── heuristic │ │ │ ├── a100_solution_file.ini │ │ │ ├── l4_solution_file.ini │ │ │ └── t4_solution_file.ini │ │ ├── ilp │ │ │ ├── a100 │ │ │ │ ├── 2024-11-07_17-25-15new.ini │ │ │ │ ├── ilp_model.lp │ │ │ │ ├── ilp_sol.ini │ │ │ │ ├── ilp_solution.sol │ │ │ │ └── simulator_cluster.ini │ │ │ ├── l4 │ │ │ │ ├── 2024-11-07_16-54-07new.ini │ │ │ │ ├── ilp_model.lp │ │ │ │ ├── ilp_sol.ini │ │ │ │ ├── ilp_solution.sol │ │ │ │ └── simulator_cluster.ini │ │ │ └── t4 │ │ │ │ ├── 2024-11-07_16-54-08new.ini │ │ │ │ ├── ilp_model.lp │ │ │ │ ├── ilp_sol.ini │ │ │ │ ├── ilp_solution.sol │ │ │ │ └── simulator_cluster.ini │ │ ├── petals │ │ │ ├── petals_sol.ini │ │ │ └── simulator_cluster.ini │ │ ├── separate │ │ │ ├── a100_simulator_cluster.ini │ │ │ ├── a100_solution_file.ini │ │ │ ├── l4_simulator_cluster.ini │ │ │ ├── l4_solution_file.ini │ │ │ ├── t4_simulator_cluster.ini │ │ │ └── t4_solution_file.ini │ │ └── swarm │ │ │ ├── simulator_cluster.ini │ │ │ └── swarm_sol.ini │ ├── layout_llama70b │ │ ├── ilp │ │ │ ├── 2024-11-07_04-01-30new.ini │ │ │ ├── ilp_model.lp │ │ │ ├── ilp_sol.ini │ │ │ ├── ilp_solution.sol │ │ │ ├── pruned_cluster.ini │ │ │ ├── simulator_cluster.ini │ │ │ └── trace.txt │ │ ├── petals │ │ │ ├── petals_sol.ini │ │ │ └── simulator_cluster.ini │ │ ├── separate │ │ │ ├── a100_simulator_cluster.ini │ │ │ ├── a100_solution_file.ini │ │ │ ├── l4_simulator_cluster.ini │ │ │ ├── l4_solution_file.ini │ │ │ ├── t4_simulator_cluster.ini │ │ │ └── t4_solution_file.ini │ │ └── swarm │ │ │ ├── simulator_cluster.ini │ │ │ └── swarm_sol.ini │ ├── run_all_simulations.sh │ ├── simulation_llama30b │ │ ├── ilp_online │ │ │ ├── a100 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ │ ├── l4 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ │ └── t4 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ ├── separate_online │ │ │ ├── a100 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ │ ├── l4 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ │ └── t4 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ └── swarm_online │ │ │ ├── decode_latency.pkl │ │ │ └── prompt_latency.pkl │ ├── simulation_llama70b │ │ ├── ilp_online │ │ │ ├── decode_latency.pkl │ │ │ └── prompt_latency.pkl │ │ ├── separate_online │ │ │ ├── a100 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ │ ├── l4 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ │ └── t4 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ └── swarm_online │ │ │ ├── decode_latency.pkl │ │ │ └── prompt_latency.pkl │ ├── step1_gen_cluster.py │ ├── step2_gen_layout.py │ └── step3_simulation.py ├── high_heterogeneity │ ├── config │ │ ├── cluster42.ini │ │ └── machine_profiles.ini │ ├── layout_llama70b │ │ ├── ilp │ │ │ ├── 2024-11-07_15-42-22new.ini │ │ │ ├── ilp_model.lp │ │ │ ├── ilp_sol.ini │ │ │ ├── ilp_solution.sol │ │ │ ├── pruned_cluster.ini │ │ │ ├── simulator_cluster.ini │ │ │ └── trace.txt │ │ ├── petals │ │ │ ├── petals_sol.ini │ │ │ └── simulator_cluster.ini │ │ ├── separate │ │ │ ├── a100 │ │ │ │ ├── simulator_cluster.ini │ │ │ │ └── solution_file.ini │ │ │ ├── l4 │ │ │ │ ├── simulator_cluster.ini │ │ │ │ └── solution_file.ini │ │ │ ├── l4x2 │ │ │ │ ├── simulator_cluster.ini │ │ │ │ └── solution_file.ini │ │ │ ├── t4x2 │ │ │ │ ├── simulator_cluster.ini │ │ │ │ └── solution_file.ini │ │ │ ├── t4x4 │ │ │ │ ├── simulator_cluster.ini │ │ │ │ └── solution_file.ini │ │ │ └── v100_t4 │ │ │ │ ├── simulator_cluster.ini │ │ │ │ └── solution_file.ini │ │ └── swarm │ │ │ ├── simulator_cluster.ini │ │ │ └── swarm_sol.ini │ ├── run_all_simulations.sh │ ├── simulation_llama70b │ │ ├── ilp_online │ │ │ ├── decode_latency.pkl │ │ │ └── prompt_latency.pkl │ │ ├── separate_online │ │ │ ├── a100 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ │ ├── l4 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ │ ├── l4x2 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ │ └── t4x4 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ ├── sp_plus_online │ │ │ ├── a100 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ │ ├── l4 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ │ ├── l4x2 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ │ ├── t4x4 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ │ └── v100_t4 │ │ │ │ ├── decode_latency.pkl │ │ │ │ └── prompt_latency.pkl │ │ └── swarm_online │ │ │ ├── decode_latency.pkl │ │ │ └── prompt_latency.pkl │ ├── step1_gen_cluster.py │ ├── step2_gen_layout.py │ └── step3_simulation.py ├── model_placement │ ├── config_distributed │ │ ├── 3cluster24.ini │ │ └── machine_profiles.ini │ ├── config_single │ │ ├── cluster24.ini │ │ └── machine_profiles.ini │ ├── layout_distributed │ │ ├── ilp │ │ │ ├── 2024-11-07_04-01-30new.ini │ │ │ ├── ilp_model.lp │ │ │ ├── ilp_sol.ini │ │ │ ├── ilp_solution.sol │ │ │ ├── pruned_cluster.ini │ │ │ ├── simulator_cluster.ini │ │ │ └── trace.txt │ │ ├── petals │ │ │ ├── petals_sol.ini │ │ │ └── simulator_cluster.ini │ │ └── swarm │ │ │ ├── simulator_cluster.ini │ │ │ └── swarm_sol.ini │ ├── layout_single │ │ ├── ilp │ │ │ ├── 2024-11-06_20-00-31new.ini │ │ │ ├── ilp_model.lp │ │ │ ├── ilp_sol.ini │ │ │ ├── ilp_solution.sol │ │ │ ├── real_sys_config.txt │ │ │ ├── simulator_cluster.ini │ │ │ └── trace.txt │ │ ├── petals │ │ │ ├── petals_sol.ini │ │ │ ├── real_sys_config.txt │ │ │ └── simulator_cluster.ini │ │ └── swarm │ │ │ ├── real_sys_config.txt │ │ │ ├── simulator_cluster.ini │ │ │ └── swarm_sol.ini │ ├── models │ │ ├── LICENSE.txt │ │ ├── config.json │ │ ├── tokenizer.json │ │ └── tokenizer_config.json │ ├── real_sys_results │ │ ├── helix │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ ├── petals │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ └── swarm │ │ │ ├── events.txt │ │ │ └── query_route.txt │ ├── remote_run.py │ ├── run_all_real_sys_parsing.sh │ ├── run_all_simulations.sh │ ├── setup1_gen_sys_config.py │ ├── setup1_parse_results.py │ ├── setup1_start_host.py │ ├── setup1_start_worker.py │ ├── setup1_visualization.py │ ├── setup2_distributed.py │ └── visualization │ │ ├── helix.jpg │ │ ├── petals.jpg │ │ └── swarm.jpg ├── request_scheduling │ ├── config_distributed │ │ ├── 3cluster24.ini │ │ └── machine_profiles.ini │ ├── config_single │ │ ├── cluster24.ini │ │ └── machine_profiles.ini │ ├── layout_distributed │ │ ├── ilp_sol.ini │ │ └── simulator_cluster.ini │ ├── layout_single │ │ ├── ilp_sol.ini │ │ ├── real_sys_config.txt │ │ └── simulator_cluster.ini │ ├── models │ │ ├── LICENSE.txt │ │ ├── config.json │ │ ├── tokenizer.json │ │ └── tokenizer_config.json │ ├── real_sys_results │ │ ├── helix │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ ├── random │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ └── swarm │ │ │ ├── events.txt │ │ │ └── query_route.txt │ ├── remote_run.py │ ├── run_all_real_sys_parsing.sh │ ├── run_all_simulations.sh │ ├── setup1_gen_sys_config.py │ ├── setup1_parse_results.py │ ├── setup1_start_host.py │ ├── setup1_start_worker.py │ └── setup2_distributed.py └── single_cluster │ ├── config │ ├── a100.ini │ ├── cluster24.ini │ ├── l4.ini │ ├── machine_profiles.ini │ └── t4.ini │ ├── layout_llama30b │ ├── ilp │ │ ├── a100 │ │ │ ├── 2024-11-06_02-28-52new.ini │ │ │ ├── ilp_model.lp │ │ │ ├── ilp_sol.ini │ │ │ ├── ilp_solution.sol │ │ │ ├── real_sys_config.txt │ │ │ └── simulator_cluster.ini │ │ ├── l4 │ │ │ ├── 2024-11-06_02-28-52new.ini │ │ │ ├── ilp_model.lp │ │ │ ├── ilp_sol.ini │ │ │ ├── ilp_solution.sol │ │ │ ├── real_sys_config.txt │ │ │ └── simulator_cluster.ini │ │ └── t4 │ │ │ ├── 2024-11-06_02-28-53new.ini │ │ │ ├── ilp_model.lp │ │ │ ├── ilp_sol.ini │ │ │ ├── ilp_solution.sol │ │ │ ├── real_sys_config.txt │ │ │ └── simulator_cluster.ini │ ├── petals │ │ ├── petals_sol.ini │ │ └── simulator_cluster.ini │ ├── separate │ │ ├── a100 │ │ │ └── real_sys_config.txt │ │ ├── a100_simulator_cluster.ini │ │ ├── a100_solution_file.ini │ │ ├── l4 │ │ │ └── real_sys_config.txt │ │ ├── l4_simulator_cluster.ini │ │ ├── l4_solution_file.ini │ │ ├── t4 │ │ │ └── real_sys_config.txt │ │ ├── t4_simulator_cluster.ini │ │ └── t4_solution_file.ini │ └── swarm │ │ ├── real_sys_config.txt │ │ ├── simulator_cluster.ini │ │ └── swarm_sol.ini │ ├── layout_llama70b │ ├── ilp │ │ ├── 2024-11-06_20-00-31new.ini │ │ ├── ilp_model.lp │ │ ├── ilp_sol.ini │ │ ├── ilp_solution.sol │ │ ├── real_sys_config.txt │ │ ├── simulator_cluster.ini │ │ └── trace.txt │ ├── petals │ │ ├── petals_sol.ini │ │ └── simulator_cluster.ini │ ├── separate │ │ ├── a100_simulator_cluster.ini │ │ ├── a100_solution_file.ini │ │ ├── l4_simulator_cluster.ini │ │ ├── l4_solution_file.ini │ │ ├── real_sys_config_a100.txt │ │ ├── real_sys_config_l4.txt │ │ ├── real_sys_config_t4.txt │ │ ├── t4_simulator_cluster.ini │ │ └── t4_solution_file.ini │ └── swarm │ │ ├── real_sys_config.txt │ │ ├── simulator_cluster.ini │ │ └── swarm_sol.ini │ ├── models │ ├── llama30b │ │ ├── LICENSE │ │ ├── config.json │ │ ├── tokenizer.json │ │ └── tokenizer_config.json │ └── llama70b │ │ ├── LICENSE.txt │ │ ├── config.json │ │ ├── tokenizer.json │ │ └── tokenizer_config.json │ ├── real_llama30b │ ├── helix_offline │ │ ├── a100 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ ├── l4 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ └── t4 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ ├── helix_online │ │ ├── a100 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ ├── l4 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ └── t4 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ ├── separate_offline │ │ ├── a100 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ ├── l4 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ └── t4 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ ├── separate_online │ │ ├── a100 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ ├── l4 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ └── t4 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ ├── swarm_offline │ │ ├── events.txt │ │ └── query_route.txt │ └── swarm_online │ │ ├── events.txt │ │ └── query_route.txt │ ├── real_llama70b │ ├── helix_offline │ │ ├── events.txt │ │ └── query_route.txt │ ├── helix_online │ │ ├── events.txt │ │ └── query_route.txt │ ├── separate_offline │ │ ├── a100 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ ├── l4 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ └── t4 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ ├── separate_online │ │ ├── a100 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ ├── l4 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ └── t4 │ │ │ ├── events.txt │ │ │ └── query_route.txt │ ├── swarm_offline │ │ ├── events.txt │ │ └── query_route.txt │ └── swarm_online │ │ ├── events.txt │ │ └── query_route.txt │ ├── remote_run.py │ ├── run_all_real_sys_parsing.sh │ ├── run_all_simulations.sh │ ├── simulation_llama30b │ ├── ilp_online │ │ ├── a100 │ │ │ ├── decode_latency.pkl │ │ │ └── prompt_latency.pkl │ │ ├── l4 │ │ │ ├── decode_latency.pkl │ │ │ └── prompt_latency.pkl │ │ └── t4 │ │ │ ├── decode_latency.pkl │ │ │ └── prompt_latency.pkl │ ├── separate_online │ │ ├── a100 │ │ │ ├── decode_latency.pkl │ │ │ └── prompt_latency.pkl │ │ ├── l4 │ │ │ ├── decode_latency.pkl │ │ │ └── prompt_latency.pkl │ │ └── t4 │ │ │ ├── decode_latency.pkl │ │ │ └── prompt_latency.pkl │ └── swarm_online │ │ ├── decode_latency.pkl │ │ └── prompt_latency.pkl │ ├── simulation_llama70b │ ├── ilp_online │ │ ├── decode_latency.pkl │ │ └── prompt_latency.pkl │ ├── separate_online │ │ ├── a100 │ │ │ ├── decode_latency.pkl │ │ │ └── prompt_latency.pkl │ │ ├── l4 │ │ │ ├── decode_latency.pkl │ │ │ └── prompt_latency.pkl │ │ └── t4 │ │ │ ├── decode_latency.pkl │ │ │ └── prompt_latency.pkl │ └── swarm_online │ │ ├── decode_latency.pkl │ │ └── prompt_latency.pkl │ ├── step1_gen_cluster.py │ ├── step2_gen_layout.py │ ├── step3_simulation.py │ ├── step4_gen_sys_config.py │ ├── step5_start_host.py │ ├── step6_start_worker.py │ └── step7_parse_results.py ├── examples ├── real_sys │ ├── config │ │ ├── machine_profile.ini │ │ ├── real_sys_config.txt │ │ └── single24.ini │ ├── layout │ │ ├── ilp_sol.ini │ │ └── simulator_cluster.ini │ ├── model │ │ ├── LICENSE.txt │ │ ├── config.json │ │ ├── tokenizer.json │ │ └── tokenizer_config.json │ ├── result │ │ ├── maxflow_offline │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ ├── maxflow_online │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ ├── random_offline │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ ├── random_online │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ ├── swarm_offline │ │ │ ├── events.txt │ │ │ └── query_route.txt │ │ └── swarm_online │ │ │ ├── events.txt │ │ │ └── query_route.txt │ ├── step1_generate_system_config.py │ ├── step2_start_host.py │ ├── step3_start_worker.py │ └── step4_parse_results.py └── simulation │ ├── config │ ├── 3cluster24.ini │ ├── machine_profile.ini │ └── single24.ini │ ├── layouts │ ├── homogeneous │ │ ├── homogeneous_sol.ini │ │ └── simulator_cluster.ini │ ├── ilp │ │ ├── 2024-11-05_18-20-39new.ini │ │ ├── ilp_model.lp │ │ ├── ilp_sol.ini │ │ ├── ilp_solution.sol │ │ └── simulator_cluster.ini │ ├── petals │ │ ├── petals_sol.ini │ │ └── simulator_cluster.ini │ ├── swarm │ │ ├── simulator_cluster.ini │ │ └── swarm_sol.ini │ └── verify │ │ ├── 2024-11-05_21-45-08load.ini │ │ ├── ilp_sol.ini │ │ └── simulator_cluster.ini │ ├── sim_files │ ├── maxflow_offline │ │ ├── latency.png │ │ ├── model_placement.jpg │ │ └── throughput.png │ └── maxflow_online │ │ ├── decode_latency.pkl │ │ ├── latency.png │ │ ├── model_placement.jpg │ │ ├── prompt_latency.pkl │ │ └── throughput.png │ ├── step1_gen_cluster.py │ ├── step2_model_placement.py │ ├── step3_run_simulation.py │ └── verify_ilp.py ├── llm_sys ├── comm │ ├── CMakeLists.txt │ ├── build.sh │ ├── setup.py │ ├── src │ │ ├── compute_worker.h │ │ ├── config_parser.h │ │ ├── const.h │ │ ├── host.h │ │ ├── inproc_queue.h │ │ ├── msg.h │ │ ├── poller.h │ │ ├── swarm.h │ │ ├── sys_host_api.cpp │ │ ├── sys_worker_api.cpp │ │ └── utils.h │ └── tests │ │ ├── test_msg.cpp │ │ ├── test_packed_client.cpp │ │ └── test_packed_server.cpp ├── engine │ ├── common.py │ ├── exec_engine.py │ ├── llama.py │ ├── model_runner.py │ ├── scheduler.py │ └── worker.py ├── gen_sys_config.py ├── heuristic_host.py ├── maxflow_host.py ├── utils.py └── worker.py ├── readme.md ├── requirements.txt ├── setup.py └── simulator ├── event_simulator ├── base_node.py ├── cluster_simulator.py ├── compute_node.py ├── coordinator_node.py ├── event.py ├── kv_cache.py ├── latency_analyzer.py ├── logger.py ├── model.py ├── network_link.py ├── query_manager.py ├── request.py └── utils.py ├── initial_layout ├── fake_cluster_generator.py ├── heterogeneous_layout │ ├── petals_layout.py │ └── swarm_layout.py ├── homogeneous_layout │ └── homogeneous_layout.py ├── ilp_layout │ └── ilp_layout.py ├── layout_synthesizer.py └── load_existing_layout.py ├── model_manager ├── base_classes.py ├── example_large │ ├── example_large.py │ ├── example_large_a100.py │ ├── example_large_h100.py │ └── example_large_t4.py ├── example_small │ ├── example_small.py │ ├── example_small_a100.py │ └── example_small_t4.py ├── google_machine_profiles.ini ├── llama1_30b │ ├── a100 │ │ ├── decode_bs2time.csv │ │ ├── llama1_30b_a100.py │ │ └── prompt_bs2time.csv │ ├── helper.py │ ├── l4 │ │ ├── decode_bs2time.csv │ │ ├── llama1_30b_l4.py │ │ └── prompt_bs2time.csv │ ├── l4x2 │ │ ├── decode_bs2time.csv │ │ ├── llama1_30b_l4x2.py │ │ └── prompt_bs2time.csv │ ├── llama1_30b.py │ ├── t4 │ │ ├── decode_bs2time.csv │ │ ├── llama1_30b_t4.py │ │ └── prompt_bs2time.csv │ ├── t4x2 │ │ ├── decode_bs2time.csv │ │ ├── llama1_30b_t4x2.py │ │ └── prompt_bs2time.csv │ ├── t4x4 │ │ ├── decode_bs2time.csv │ │ ├── llama1_30b_t4x4.py │ │ └── prompt_bs2time.csv │ └── v100 │ │ ├── decode_bs2time.csv │ │ ├── llama1_30b_v100.py │ │ └── prompt_bs2time.csv ├── llama2_70b │ ├── a100 │ │ ├── decode_bs2time.csv │ │ ├── llama2_70b_a100.py │ │ └── prompt_bs2time.csv │ ├── helper.py │ ├── l4 │ │ ├── decode_bs2time.csv │ │ ├── llama2_70b_l4.py │ │ └── prompt_bs2time.csv │ ├── l4x2 │ │ ├── decode_bs2time.csv │ │ ├── llama2_70b_l4x2.py │ │ └── prompt_bs2time.csv │ ├── llama2_70b.py │ ├── t4 │ │ ├── decode_bs2time.csv │ │ ├── llama2_70b_t4.py │ │ └── prompt_bs2time.csv │ ├── t4x2 │ │ ├── decode_bs2time.csv │ │ ├── llama2_70b_t4x2.py │ │ └── prompt_bs2time.csv │ ├── t4x4 │ │ ├── decode_bs2time.csv │ │ ├── llama2_70b_t4x4.py │ │ └── prompt_bs2time.csv │ └── v100 │ │ ├── decode_bs2time.csv │ │ ├── llama2_70b_v100.py │ │ └── prompt_bs2time.csv ├── model_manager.py └── template_machine_on_node.py ├── scheduler ├── base_scheduler.py ├── execution_policy.py ├── global_maxflow │ ├── global_maxflow_scheduler.py │ ├── interleaved_weighted_round_robin.py │ ├── kv_expectation.py │ ├── network_flow.py │ └── scheduler_core.py ├── local_maxflow │ ├── maxflow_scheduler.py │ └── maxflow_utils.py ├── naive_scheduler.py ├── shortest_queue │ └── shortest_queue_scheduler.py └── swarm │ └── swarm_scheduler.py └── trace_generator ├── arrival_rate ├── azure_code_arrive_time.pkl └── azure_conv_arrive_time.pkl ├── arrival_rate_sampler.py ├── length_data ├── alpaca_input.pkl ├── alpaca_output.pkl ├── azure_code_input.pkl ├── azure_code_output.pkl ├── azure_conv_input.pkl ├── azure_conv_output.pkl ├── shared_gpt_input.pkl └── shared_gpt_output.pkl ├── length_sampler.py ├── simulator_query_feeder.py └── trace_generator.py /.gitignore: -------------------------------------------------------------------------------- 1 | .idea -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/LICENSE -------------------------------------------------------------------------------- /artifact_evaluation/ablation/ablation1_pruning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/ablation1_pruning.py -------------------------------------------------------------------------------- /artifact_evaluation/ablation/ablation2_initial.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/ablation2_initial.py -------------------------------------------------------------------------------- /artifact_evaluation/ablation/ablation3_quality.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/ablation3_quality.py -------------------------------------------------------------------------------- /artifact_evaluation/ablation/config/3cluster24.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/config/3cluster24.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/config/cluster10.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/config/cluster10.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/config/cluster42.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/config/cluster42.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/config/machine_profiles.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/config/machine_profiles.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/heuristics/cluster24/swarm_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/heuristics/cluster24/swarm_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/heuristics/cluster42/swarm_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/heuristics/cluster42/swarm_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/no_prune_24/2024-11-08_16-15-10new.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/no_prune_24/2024-11-08_16-15-10new.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/no_prune_24/ilp_model.lp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/no_prune_24/ilp_model.lp -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/no_prune_24/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/no_prune_24/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/no_prune_24/ilp_solution.sol: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/no_prune_24/ilp_solution.sol -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/no_prune_24/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/no_prune_24/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/no_prune_24/trace.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/no_prune_24/trace.txt -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/no_prune_42/2024-11-08_17-04-45new.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/no_prune_42/2024-11-08_17-04-45new.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/no_prune_42/ilp_model.lp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/no_prune_42/ilp_model.lp -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/no_prune_42/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/no_prune_42/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/no_prune_42/ilp_solution.sol: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/no_prune_42/ilp_solution.sol -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/no_prune_42/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/no_prune_42/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/no_prune_42/trace.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/no_prune_42/trace.txt -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/quality/2024-10-26_19-46-55new.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/quality/2024-10-26_19-46-55new.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/quality/ilp_model.lp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/quality/ilp_model.lp -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/quality/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/quality/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/quality/ilp_solution.sol: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/quality/ilp_solution.sol -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/quality/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/quality/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/quality/trace.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/quality/trace.txt -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/raw_24/2024-11-08_18-30-19new.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/raw_24/2024-11-08_18-30-19new.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/raw_24/ilp_model.lp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/raw_24/ilp_model.lp -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/raw_24/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/raw_24/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/raw_24/ilp_solution.sol: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/raw_24/ilp_solution.sol -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/raw_24/pruned_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/raw_24/pruned_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/raw_24/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/raw_24/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/raw_24/trace.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/raw_24/trace.txt -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/raw_42/2024-11-08_20-49-18new.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/raw_42/2024-11-08_20-49-18new.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/raw_42/ilp_model.lp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/raw_42/ilp_model.lp -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/raw_42/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/raw_42/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/raw_42/ilp_solution.sol: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/raw_42/ilp_solution.sol -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/raw_42/pruned_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/raw_42/pruned_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/raw_42/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/raw_42/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/ablation/layouts/raw_42/trace.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ablation/layouts/raw_42/trace.txt -------------------------------------------------------------------------------- /artifact_evaluation/ae_readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/ae_readme.md -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/config/3cluster24.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/config/3cluster24.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/config/a100.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/config/a100.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/config/l4.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/config/l4.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/config/machine_profiles.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/config/machine_profiles.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/config/t4.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/config/t4.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/heuristic/a100_solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/heuristic/a100_solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/heuristic/l4_solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/heuristic/l4_solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/heuristic/t4_solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/heuristic/t4_solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/ilp/a100/2024-11-07_17-25-15new.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/ilp/a100/2024-11-07_17-25-15new.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/ilp/a100/ilp_model.lp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/ilp/a100/ilp_model.lp -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/ilp/a100/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/ilp/a100/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/ilp/a100/ilp_solution.sol: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/ilp/a100/ilp_solution.sol -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/ilp/a100/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/ilp/a100/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/ilp/l4/2024-11-07_16-54-07new.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/ilp/l4/2024-11-07_16-54-07new.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/ilp/l4/ilp_model.lp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/ilp/l4/ilp_model.lp -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/ilp/l4/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/ilp/l4/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/ilp/l4/ilp_solution.sol: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/ilp/l4/ilp_solution.sol -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/ilp/l4/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/ilp/l4/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/ilp/t4/2024-11-07_16-54-08new.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/ilp/t4/2024-11-07_16-54-08new.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/ilp/t4/ilp_model.lp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/ilp/t4/ilp_model.lp -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/ilp/t4/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/ilp/t4/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/ilp/t4/ilp_solution.sol: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/ilp/t4/ilp_solution.sol -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/ilp/t4/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/ilp/t4/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/petals/petals_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/petals/petals_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/petals/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/petals/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/separate/a100_simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/separate/a100_simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/separate/a100_solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/separate/a100_solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/separate/l4_simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/separate/l4_simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/separate/l4_solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/separate/l4_solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/separate/t4_simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/separate/t4_simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/separate/t4_solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/separate/t4_solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/swarm/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/swarm/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama30b/swarm/swarm_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama30b/swarm/swarm_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama70b/ilp/2024-11-07_04-01-30new.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama70b/ilp/2024-11-07_04-01-30new.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama70b/ilp/ilp_model.lp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama70b/ilp/ilp_model.lp -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama70b/ilp/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama70b/ilp/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama70b/ilp/ilp_solution.sol: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama70b/ilp/ilp_solution.sol -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama70b/ilp/pruned_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama70b/ilp/pruned_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama70b/ilp/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama70b/ilp/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama70b/ilp/trace.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama70b/ilp/trace.txt -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama70b/petals/petals_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama70b/petals/petals_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama70b/petals/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama70b/petals/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama70b/separate/a100_simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama70b/separate/a100_simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama70b/separate/a100_solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama70b/separate/a100_solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama70b/separate/l4_simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama70b/separate/l4_simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama70b/separate/l4_solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama70b/separate/l4_solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama70b/separate/t4_simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama70b/separate/t4_simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama70b/separate/t4_solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama70b/separate/t4_solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama70b/swarm/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama70b/swarm/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/layout_llama70b/swarm/swarm_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/layout_llama70b/swarm/swarm_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/run_all_simulations.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/run_all_simulations.sh -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama30b/ilp_online/a100/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama30b/ilp_online/a100/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama30b/ilp_online/a100/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama30b/ilp_online/a100/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama30b/ilp_online/l4/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama30b/ilp_online/l4/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama30b/ilp_online/l4/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama30b/ilp_online/l4/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama30b/ilp_online/t4/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama30b/ilp_online/t4/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama30b/ilp_online/t4/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama30b/ilp_online/t4/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama30b/separate_online/a100/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama30b/separate_online/a100/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama30b/separate_online/a100/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama30b/separate_online/a100/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama30b/separate_online/l4/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama30b/separate_online/l4/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama30b/separate_online/l4/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama30b/separate_online/l4/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama30b/separate_online/t4/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama30b/separate_online/t4/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama30b/separate_online/t4/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama30b/separate_online/t4/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama30b/swarm_online/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama30b/swarm_online/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama30b/swarm_online/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama30b/swarm_online/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama70b/ilp_online/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama70b/ilp_online/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama70b/ilp_online/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama70b/ilp_online/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama70b/separate_online/a100/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama70b/separate_online/a100/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama70b/separate_online/a100/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama70b/separate_online/a100/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama70b/separate_online/l4/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama70b/separate_online/l4/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama70b/separate_online/l4/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama70b/separate_online/l4/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama70b/separate_online/t4/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama70b/separate_online/t4/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama70b/separate_online/t4/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama70b/separate_online/t4/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama70b/swarm_online/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama70b/swarm_online/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/simulation_llama70b/swarm_online/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/simulation_llama70b/swarm_online/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/step1_gen_cluster.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/step1_gen_cluster.py -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/step2_gen_layout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/step2_gen_layout.py -------------------------------------------------------------------------------- /artifact_evaluation/distributed_clusters/step3_simulation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/distributed_clusters/step3_simulation.py -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/config/cluster42.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/config/cluster42.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/config/machine_profiles.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/config/machine_profiles.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/ilp/2024-11-07_15-42-22new.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/ilp/2024-11-07_15-42-22new.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/ilp/ilp_model.lp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/ilp/ilp_model.lp -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/ilp/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/ilp/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/ilp/ilp_solution.sol: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/ilp/ilp_solution.sol -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/ilp/pruned_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/ilp/pruned_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/ilp/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/ilp/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/ilp/trace.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/ilp/trace.txt -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/petals/petals_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/petals/petals_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/petals/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/petals/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/separate/a100/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/separate/a100/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/separate/a100/solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/separate/a100/solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/separate/l4/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/separate/l4/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/separate/l4/solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/separate/l4/solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/separate/l4x2/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/separate/l4x2/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/separate/l4x2/solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/separate/l4x2/solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/separate/t4x2/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/separate/t4x2/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/separate/t4x2/solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/separate/t4x2/solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/separate/t4x4/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/separate/t4x4/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/separate/t4x4/solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/separate/t4x4/solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/separate/v100_t4/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/separate/v100_t4/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/separate/v100_t4/solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/separate/v100_t4/solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/swarm/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/swarm/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/layout_llama70b/swarm/swarm_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/layout_llama70b/swarm/swarm_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/run_all_simulations.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/run_all_simulations.sh -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/ilp_online/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/ilp_online/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/ilp_online/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/ilp_online/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/separate_online/a100/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/separate_online/a100/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/separate_online/a100/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/separate_online/a100/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/separate_online/l4/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/separate_online/l4/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/separate_online/l4/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/separate_online/l4/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/separate_online/l4x2/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/separate_online/l4x2/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/separate_online/l4x2/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/separate_online/l4x2/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/separate_online/t4x4/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/separate_online/t4x4/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/separate_online/t4x4/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/separate_online/t4x4/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/a100/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/a100/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/a100/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/a100/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/l4/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/l4/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/l4/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/l4/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/l4x2/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/l4x2/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/l4x2/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/l4x2/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/t4x4/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/t4x4/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/t4x4/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/t4x4/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/v100_t4/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/v100_t4/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/v100_t4/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/sp_plus_online/v100_t4/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/swarm_online/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/swarm_online/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/simulation_llama70b/swarm_online/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/simulation_llama70b/swarm_online/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/step1_gen_cluster.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/step1_gen_cluster.py -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/step2_gen_layout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/step2_gen_layout.py -------------------------------------------------------------------------------- /artifact_evaluation/high_heterogeneity/step3_simulation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/high_heterogeneity/step3_simulation.py -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/config_distributed/3cluster24.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/config_distributed/3cluster24.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/config_distributed/machine_profiles.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/config_distributed/machine_profiles.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/config_single/cluster24.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/config_single/cluster24.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/config_single/machine_profiles.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/config_single/machine_profiles.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_distributed/ilp/2024-11-07_04-01-30new.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_distributed/ilp/2024-11-07_04-01-30new.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_distributed/ilp/ilp_model.lp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_distributed/ilp/ilp_model.lp -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_distributed/ilp/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_distributed/ilp/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_distributed/ilp/ilp_solution.sol: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_distributed/ilp/ilp_solution.sol -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_distributed/ilp/pruned_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_distributed/ilp/pruned_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_distributed/ilp/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_distributed/ilp/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_distributed/ilp/trace.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_distributed/ilp/trace.txt -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_distributed/petals/petals_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_distributed/petals/petals_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_distributed/petals/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_distributed/petals/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_distributed/swarm/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_distributed/swarm/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_distributed/swarm/swarm_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_distributed/swarm/swarm_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_single/ilp/2024-11-06_20-00-31new.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_single/ilp/2024-11-06_20-00-31new.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_single/ilp/ilp_model.lp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_single/ilp/ilp_model.lp -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_single/ilp/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_single/ilp/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_single/ilp/ilp_solution.sol: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_single/ilp/ilp_solution.sol -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_single/ilp/real_sys_config.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_single/ilp/real_sys_config.txt -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_single/ilp/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_single/ilp/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_single/ilp/trace.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_single/ilp/trace.txt -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_single/petals/petals_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_single/petals/petals_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_single/petals/real_sys_config.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_single/petals/real_sys_config.txt -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_single/petals/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_single/petals/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_single/swarm/real_sys_config.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_single/swarm/real_sys_config.txt -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_single/swarm/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_single/swarm/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/layout_single/swarm/swarm_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/layout_single/swarm/swarm_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/models/LICENSE.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/models/LICENSE.txt -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/models/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/models/config.json -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/models/tokenizer.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/models/tokenizer.json -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/models/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/models/tokenizer_config.json -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/real_sys_results/helix/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/real_sys_results/helix/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/real_sys_results/helix/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/real_sys_results/helix/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/real_sys_results/petals/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/real_sys_results/petals/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/real_sys_results/petals/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/real_sys_results/petals/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/real_sys_results/swarm/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/real_sys_results/swarm/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/real_sys_results/swarm/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/real_sys_results/swarm/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/remote_run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/remote_run.py -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/run_all_real_sys_parsing.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/run_all_real_sys_parsing.sh -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/run_all_simulations.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/run_all_simulations.sh -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/setup1_gen_sys_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/setup1_gen_sys_config.py -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/setup1_parse_results.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/setup1_parse_results.py -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/setup1_start_host.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/setup1_start_host.py -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/setup1_start_worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/setup1_start_worker.py -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/setup1_visualization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/setup1_visualization.py -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/setup2_distributed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/setup2_distributed.py -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/visualization/helix.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/visualization/helix.jpg -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/visualization/petals.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/visualization/petals.jpg -------------------------------------------------------------------------------- /artifact_evaluation/model_placement/visualization/swarm.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/model_placement/visualization/swarm.jpg -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/config_distributed/3cluster24.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/config_distributed/3cluster24.ini -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/config_distributed/machine_profiles.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/config_distributed/machine_profiles.ini -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/config_single/cluster24.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/config_single/cluster24.ini -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/config_single/machine_profiles.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/config_single/machine_profiles.ini -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/layout_distributed/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/layout_distributed/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/layout_distributed/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/layout_distributed/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/layout_single/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/layout_single/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/layout_single/real_sys_config.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/layout_single/real_sys_config.txt -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/layout_single/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/layout_single/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/models/LICENSE.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/models/LICENSE.txt -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/models/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/models/config.json -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/models/tokenizer.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/models/tokenizer.json -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/models/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/models/tokenizer_config.json -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/real_sys_results/helix/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/real_sys_results/helix/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/real_sys_results/helix/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/real_sys_results/helix/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/real_sys_results/random/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/real_sys_results/random/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/real_sys_results/random/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/real_sys_results/random/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/real_sys_results/swarm/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/real_sys_results/swarm/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/real_sys_results/swarm/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/real_sys_results/swarm/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/remote_run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/remote_run.py -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/run_all_real_sys_parsing.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/run_all_real_sys_parsing.sh -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/run_all_simulations.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/run_all_simulations.sh -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/setup1_gen_sys_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/setup1_gen_sys_config.py -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/setup1_parse_results.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/setup1_parse_results.py -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/setup1_start_host.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/setup1_start_host.py -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/setup1_start_worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/setup1_start_worker.py -------------------------------------------------------------------------------- /artifact_evaluation/request_scheduling/setup2_distributed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/request_scheduling/setup2_distributed.py -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/config/a100.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/config/a100.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/config/cluster24.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/config/cluster24.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/config/l4.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/config/l4.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/config/machine_profiles.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/config/machine_profiles.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/config/t4.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/config/t4.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/a100/2024-11-06_02-28-52new.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/a100/2024-11-06_02-28-52new.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/a100/ilp_model.lp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/a100/ilp_model.lp -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/a100/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/a100/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/a100/ilp_solution.sol: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/a100/ilp_solution.sol -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/a100/real_sys_config.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/a100/real_sys_config.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/a100/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/a100/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/l4/2024-11-06_02-28-52new.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/l4/2024-11-06_02-28-52new.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/l4/ilp_model.lp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/l4/ilp_model.lp -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/l4/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/l4/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/l4/ilp_solution.sol: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/l4/ilp_solution.sol -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/l4/real_sys_config.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/l4/real_sys_config.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/l4/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/l4/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/t4/2024-11-06_02-28-53new.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/t4/2024-11-06_02-28-53new.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/t4/ilp_model.lp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/t4/ilp_model.lp -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/t4/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/t4/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/t4/ilp_solution.sol: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/t4/ilp_solution.sol -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/t4/real_sys_config.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/t4/real_sys_config.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/ilp/t4/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/ilp/t4/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/petals/petals_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/petals/petals_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/petals/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/petals/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/separate/a100/real_sys_config.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/separate/a100/real_sys_config.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/separate/a100_simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/separate/a100_simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/separate/a100_solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/separate/a100_solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/separate/l4/real_sys_config.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/separate/l4/real_sys_config.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/separate/l4_simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/separate/l4_simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/separate/l4_solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/separate/l4_solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/separate/t4/real_sys_config.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/separate/t4/real_sys_config.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/separate/t4_simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/separate/t4_simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/separate/t4_solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/separate/t4_solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/swarm/real_sys_config.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/swarm/real_sys_config.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/swarm/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/swarm/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama30b/swarm/swarm_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama30b/swarm/swarm_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/ilp/2024-11-06_20-00-31new.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/ilp/2024-11-06_20-00-31new.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/ilp/ilp_model.lp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/ilp/ilp_model.lp -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/ilp/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/ilp/ilp_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/ilp/ilp_solution.sol: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/ilp/ilp_solution.sol -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/ilp/real_sys_config.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/ilp/real_sys_config.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/ilp/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/ilp/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/ilp/trace.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/ilp/trace.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/petals/petals_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/petals/petals_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/petals/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/petals/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/separate/a100_simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/separate/a100_simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/separate/a100_solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/separate/a100_solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/separate/l4_simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/separate/l4_simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/separate/l4_solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/separate/l4_solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/separate/real_sys_config_a100.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/separate/real_sys_config_a100.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/separate/real_sys_config_l4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/separate/real_sys_config_l4.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/separate/real_sys_config_t4.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/separate/real_sys_config_t4.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/separate/t4_simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/separate/t4_simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/separate/t4_solution_file.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/separate/t4_solution_file.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/swarm/real_sys_config.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/swarm/real_sys_config.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/swarm/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/swarm/simulator_cluster.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/layout_llama70b/swarm/swarm_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/layout_llama70b/swarm/swarm_sol.ini -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/models/llama30b/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/models/llama30b/LICENSE -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/models/llama30b/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/models/llama30b/config.json -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/models/llama30b/tokenizer.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/models/llama30b/tokenizer.json -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/models/llama30b/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/models/llama30b/tokenizer_config.json -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/models/llama70b/LICENSE.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/models/llama70b/LICENSE.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/models/llama70b/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/models/llama70b/config.json -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/models/llama70b/tokenizer.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/models/llama70b/tokenizer.json -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/models/llama70b/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/models/llama70b/tokenizer_config.json -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/helix_offline/a100/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/helix_offline/a100/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/helix_offline/a100/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/helix_offline/a100/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/helix_offline/l4/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/helix_offline/l4/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/helix_offline/l4/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/helix_offline/l4/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/helix_offline/t4/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/helix_offline/t4/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/helix_offline/t4/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/helix_offline/t4/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/helix_online/a100/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/helix_online/a100/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/helix_online/a100/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/helix_online/a100/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/helix_online/l4/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/helix_online/l4/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/helix_online/l4/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/helix_online/l4/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/helix_online/t4/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/helix_online/t4/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/helix_online/t4/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/helix_online/t4/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/separate_offline/a100/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/separate_offline/a100/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/separate_offline/a100/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/separate_offline/a100/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/separate_offline/l4/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/separate_offline/l4/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/separate_offline/l4/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/separate_offline/l4/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/separate_offline/t4/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/separate_offline/t4/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/separate_offline/t4/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/separate_offline/t4/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/separate_online/a100/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/separate_online/a100/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/separate_online/a100/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/separate_online/a100/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/separate_online/l4/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/separate_online/l4/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/separate_online/l4/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/separate_online/l4/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/separate_online/t4/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/separate_online/t4/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/separate_online/t4/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/separate_online/t4/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/swarm_offline/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/swarm_offline/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/swarm_offline/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/swarm_offline/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/swarm_online/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/swarm_online/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama30b/swarm_online/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama30b/swarm_online/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/helix_offline/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/helix_offline/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/helix_offline/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/helix_offline/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/helix_online/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/helix_online/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/helix_online/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/helix_online/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/separate_offline/a100/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/separate_offline/a100/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/separate_offline/a100/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/separate_offline/a100/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/separate_offline/l4/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/separate_offline/l4/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/separate_offline/l4/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/separate_offline/l4/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/separate_offline/t4/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/separate_offline/t4/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/separate_offline/t4/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/separate_offline/t4/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/separate_online/a100/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/separate_online/a100/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/separate_online/a100/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/separate_online/a100/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/separate_online/l4/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/separate_online/l4/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/separate_online/l4/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/separate_online/l4/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/separate_online/t4/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/separate_online/t4/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/separate_online/t4/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/separate_online/t4/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/swarm_offline/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/swarm_offline/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/swarm_offline/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/swarm_offline/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/swarm_online/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/swarm_online/events.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/real_llama70b/swarm_online/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/real_llama70b/swarm_online/query_route.txt -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/remote_run.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/remote_run.py -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/run_all_real_sys_parsing.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/run_all_real_sys_parsing.sh -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/run_all_simulations.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/run_all_simulations.sh -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama30b/ilp_online/a100/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama30b/ilp_online/a100/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama30b/ilp_online/a100/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama30b/ilp_online/a100/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama30b/ilp_online/l4/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama30b/ilp_online/l4/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama30b/ilp_online/l4/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama30b/ilp_online/l4/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama30b/ilp_online/t4/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama30b/ilp_online/t4/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama30b/ilp_online/t4/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama30b/ilp_online/t4/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama30b/separate_online/a100/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama30b/separate_online/a100/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama30b/separate_online/a100/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama30b/separate_online/a100/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama30b/separate_online/l4/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama30b/separate_online/l4/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama30b/separate_online/l4/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama30b/separate_online/l4/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama30b/separate_online/t4/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama30b/separate_online/t4/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama30b/separate_online/t4/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama30b/separate_online/t4/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama30b/swarm_online/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama30b/swarm_online/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama30b/swarm_online/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama30b/swarm_online/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama70b/ilp_online/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama70b/ilp_online/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama70b/ilp_online/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama70b/ilp_online/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama70b/separate_online/a100/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama70b/separate_online/a100/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama70b/separate_online/a100/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama70b/separate_online/a100/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama70b/separate_online/l4/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama70b/separate_online/l4/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama70b/separate_online/l4/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama70b/separate_online/l4/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama70b/separate_online/t4/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama70b/separate_online/t4/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama70b/separate_online/t4/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama70b/separate_online/t4/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama70b/swarm_online/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama70b/swarm_online/decode_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/simulation_llama70b/swarm_online/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/simulation_llama70b/swarm_online/prompt_latency.pkl -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/step1_gen_cluster.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/step1_gen_cluster.py -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/step2_gen_layout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/step2_gen_layout.py -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/step3_simulation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/step3_simulation.py -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/step4_gen_sys_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/step4_gen_sys_config.py -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/step5_start_host.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/step5_start_host.py -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/step6_start_worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/step6_start_worker.py -------------------------------------------------------------------------------- /artifact_evaluation/single_cluster/step7_parse_results.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/artifact_evaluation/single_cluster/step7_parse_results.py -------------------------------------------------------------------------------- /examples/real_sys/config/machine_profile.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/config/machine_profile.ini -------------------------------------------------------------------------------- /examples/real_sys/config/real_sys_config.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/config/real_sys_config.txt -------------------------------------------------------------------------------- /examples/real_sys/config/single24.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/config/single24.ini -------------------------------------------------------------------------------- /examples/real_sys/layout/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/layout/ilp_sol.ini -------------------------------------------------------------------------------- /examples/real_sys/layout/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/layout/simulator_cluster.ini -------------------------------------------------------------------------------- /examples/real_sys/model/LICENSE.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/model/LICENSE.txt -------------------------------------------------------------------------------- /examples/real_sys/model/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/model/config.json -------------------------------------------------------------------------------- /examples/real_sys/model/tokenizer.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/model/tokenizer.json -------------------------------------------------------------------------------- /examples/real_sys/model/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/model/tokenizer_config.json -------------------------------------------------------------------------------- /examples/real_sys/result/maxflow_offline/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/result/maxflow_offline/events.txt -------------------------------------------------------------------------------- /examples/real_sys/result/maxflow_offline/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/result/maxflow_offline/query_route.txt -------------------------------------------------------------------------------- /examples/real_sys/result/maxflow_online/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/result/maxflow_online/events.txt -------------------------------------------------------------------------------- /examples/real_sys/result/maxflow_online/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/result/maxflow_online/query_route.txt -------------------------------------------------------------------------------- /examples/real_sys/result/random_offline/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/result/random_offline/events.txt -------------------------------------------------------------------------------- /examples/real_sys/result/random_offline/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/result/random_offline/query_route.txt -------------------------------------------------------------------------------- /examples/real_sys/result/random_online/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/result/random_online/events.txt -------------------------------------------------------------------------------- /examples/real_sys/result/random_online/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/result/random_online/query_route.txt -------------------------------------------------------------------------------- /examples/real_sys/result/swarm_offline/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/result/swarm_offline/events.txt -------------------------------------------------------------------------------- /examples/real_sys/result/swarm_offline/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/result/swarm_offline/query_route.txt -------------------------------------------------------------------------------- /examples/real_sys/result/swarm_online/events.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/result/swarm_online/events.txt -------------------------------------------------------------------------------- /examples/real_sys/result/swarm_online/query_route.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/result/swarm_online/query_route.txt -------------------------------------------------------------------------------- /examples/real_sys/step1_generate_system_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/step1_generate_system_config.py -------------------------------------------------------------------------------- /examples/real_sys/step2_start_host.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/step2_start_host.py -------------------------------------------------------------------------------- /examples/real_sys/step3_start_worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/step3_start_worker.py -------------------------------------------------------------------------------- /examples/real_sys/step4_parse_results.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/real_sys/step4_parse_results.py -------------------------------------------------------------------------------- /examples/simulation/config/3cluster24.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/config/3cluster24.ini -------------------------------------------------------------------------------- /examples/simulation/config/machine_profile.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/config/machine_profile.ini -------------------------------------------------------------------------------- /examples/simulation/config/single24.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/config/single24.ini -------------------------------------------------------------------------------- /examples/simulation/layouts/homogeneous/homogeneous_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/layouts/homogeneous/homogeneous_sol.ini -------------------------------------------------------------------------------- /examples/simulation/layouts/homogeneous/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/layouts/homogeneous/simulator_cluster.ini -------------------------------------------------------------------------------- /examples/simulation/layouts/ilp/2024-11-05_18-20-39new.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/layouts/ilp/2024-11-05_18-20-39new.ini -------------------------------------------------------------------------------- /examples/simulation/layouts/ilp/ilp_model.lp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/layouts/ilp/ilp_model.lp -------------------------------------------------------------------------------- /examples/simulation/layouts/ilp/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/layouts/ilp/ilp_sol.ini -------------------------------------------------------------------------------- /examples/simulation/layouts/ilp/ilp_solution.sol: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/layouts/ilp/ilp_solution.sol -------------------------------------------------------------------------------- /examples/simulation/layouts/ilp/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/layouts/ilp/simulator_cluster.ini -------------------------------------------------------------------------------- /examples/simulation/layouts/petals/petals_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/layouts/petals/petals_sol.ini -------------------------------------------------------------------------------- /examples/simulation/layouts/petals/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/layouts/petals/simulator_cluster.ini -------------------------------------------------------------------------------- /examples/simulation/layouts/swarm/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/layouts/swarm/simulator_cluster.ini -------------------------------------------------------------------------------- /examples/simulation/layouts/swarm/swarm_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/layouts/swarm/swarm_sol.ini -------------------------------------------------------------------------------- /examples/simulation/layouts/verify/2024-11-05_21-45-08load.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/layouts/verify/2024-11-05_21-45-08load.ini -------------------------------------------------------------------------------- /examples/simulation/layouts/verify/ilp_sol.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/layouts/verify/ilp_sol.ini -------------------------------------------------------------------------------- /examples/simulation/layouts/verify/simulator_cluster.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/layouts/verify/simulator_cluster.ini -------------------------------------------------------------------------------- /examples/simulation/sim_files/maxflow_offline/latency.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/sim_files/maxflow_offline/latency.png -------------------------------------------------------------------------------- /examples/simulation/sim_files/maxflow_offline/model_placement.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/sim_files/maxflow_offline/model_placement.jpg -------------------------------------------------------------------------------- /examples/simulation/sim_files/maxflow_offline/throughput.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/sim_files/maxflow_offline/throughput.png -------------------------------------------------------------------------------- /examples/simulation/sim_files/maxflow_online/decode_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/sim_files/maxflow_online/decode_latency.pkl -------------------------------------------------------------------------------- /examples/simulation/sim_files/maxflow_online/latency.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/sim_files/maxflow_online/latency.png -------------------------------------------------------------------------------- /examples/simulation/sim_files/maxflow_online/model_placement.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/sim_files/maxflow_online/model_placement.jpg -------------------------------------------------------------------------------- /examples/simulation/sim_files/maxflow_online/prompt_latency.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/sim_files/maxflow_online/prompt_latency.pkl -------------------------------------------------------------------------------- /examples/simulation/sim_files/maxflow_online/throughput.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/sim_files/maxflow_online/throughput.png -------------------------------------------------------------------------------- /examples/simulation/step1_gen_cluster.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/step1_gen_cluster.py -------------------------------------------------------------------------------- /examples/simulation/step2_model_placement.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/step2_model_placement.py -------------------------------------------------------------------------------- /examples/simulation/step3_run_simulation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/step3_run_simulation.py -------------------------------------------------------------------------------- /examples/simulation/verify_ilp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/examples/simulation/verify_ilp.py -------------------------------------------------------------------------------- /llm_sys/comm/CMakeLists.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/comm/CMakeLists.txt -------------------------------------------------------------------------------- /llm_sys/comm/build.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/comm/build.sh -------------------------------------------------------------------------------- /llm_sys/comm/setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/comm/setup.py -------------------------------------------------------------------------------- /llm_sys/comm/src/compute_worker.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/comm/src/compute_worker.h -------------------------------------------------------------------------------- /llm_sys/comm/src/config_parser.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/comm/src/config_parser.h -------------------------------------------------------------------------------- /llm_sys/comm/src/const.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/comm/src/const.h -------------------------------------------------------------------------------- /llm_sys/comm/src/host.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/comm/src/host.h -------------------------------------------------------------------------------- /llm_sys/comm/src/inproc_queue.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/comm/src/inproc_queue.h -------------------------------------------------------------------------------- /llm_sys/comm/src/msg.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/comm/src/msg.h -------------------------------------------------------------------------------- /llm_sys/comm/src/poller.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/comm/src/poller.h -------------------------------------------------------------------------------- /llm_sys/comm/src/swarm.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/comm/src/swarm.h -------------------------------------------------------------------------------- /llm_sys/comm/src/sys_host_api.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/comm/src/sys_host_api.cpp -------------------------------------------------------------------------------- /llm_sys/comm/src/sys_worker_api.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/comm/src/sys_worker_api.cpp -------------------------------------------------------------------------------- /llm_sys/comm/src/utils.h: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/comm/src/utils.h -------------------------------------------------------------------------------- /llm_sys/comm/tests/test_msg.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/comm/tests/test_msg.cpp -------------------------------------------------------------------------------- /llm_sys/comm/tests/test_packed_client.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/comm/tests/test_packed_client.cpp -------------------------------------------------------------------------------- /llm_sys/comm/tests/test_packed_server.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/comm/tests/test_packed_server.cpp -------------------------------------------------------------------------------- /llm_sys/engine/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/engine/common.py -------------------------------------------------------------------------------- /llm_sys/engine/exec_engine.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/engine/exec_engine.py -------------------------------------------------------------------------------- /llm_sys/engine/llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/engine/llama.py -------------------------------------------------------------------------------- /llm_sys/engine/model_runner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/engine/model_runner.py -------------------------------------------------------------------------------- /llm_sys/engine/scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/engine/scheduler.py -------------------------------------------------------------------------------- /llm_sys/engine/worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/engine/worker.py -------------------------------------------------------------------------------- /llm_sys/gen_sys_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/gen_sys_config.py -------------------------------------------------------------------------------- /llm_sys/heuristic_host.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/heuristic_host.py -------------------------------------------------------------------------------- /llm_sys/maxflow_host.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/maxflow_host.py -------------------------------------------------------------------------------- /llm_sys/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/utils.py -------------------------------------------------------------------------------- /llm_sys/worker.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/llm_sys/worker.py -------------------------------------------------------------------------------- /readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/readme.md -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | networkx~=3.2.1 2 | matplotlib~=3.8.2 3 | gurobipy~=11.0.0 -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/setup.py -------------------------------------------------------------------------------- /simulator/event_simulator/base_node.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/event_simulator/base_node.py -------------------------------------------------------------------------------- /simulator/event_simulator/cluster_simulator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/event_simulator/cluster_simulator.py -------------------------------------------------------------------------------- /simulator/event_simulator/compute_node.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/event_simulator/compute_node.py -------------------------------------------------------------------------------- /simulator/event_simulator/coordinator_node.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/event_simulator/coordinator_node.py -------------------------------------------------------------------------------- /simulator/event_simulator/event.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/event_simulator/event.py -------------------------------------------------------------------------------- /simulator/event_simulator/kv_cache.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/event_simulator/kv_cache.py -------------------------------------------------------------------------------- /simulator/event_simulator/latency_analyzer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/event_simulator/latency_analyzer.py -------------------------------------------------------------------------------- /simulator/event_simulator/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/event_simulator/logger.py -------------------------------------------------------------------------------- /simulator/event_simulator/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/event_simulator/model.py -------------------------------------------------------------------------------- /simulator/event_simulator/network_link.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/event_simulator/network_link.py -------------------------------------------------------------------------------- /simulator/event_simulator/query_manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/event_simulator/query_manager.py -------------------------------------------------------------------------------- /simulator/event_simulator/request.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/event_simulator/request.py -------------------------------------------------------------------------------- /simulator/event_simulator/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/event_simulator/utils.py -------------------------------------------------------------------------------- /simulator/initial_layout/fake_cluster_generator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/initial_layout/fake_cluster_generator.py -------------------------------------------------------------------------------- /simulator/initial_layout/heterogeneous_layout/petals_layout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/initial_layout/heterogeneous_layout/petals_layout.py -------------------------------------------------------------------------------- /simulator/initial_layout/heterogeneous_layout/swarm_layout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/initial_layout/heterogeneous_layout/swarm_layout.py -------------------------------------------------------------------------------- /simulator/initial_layout/homogeneous_layout/homogeneous_layout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/initial_layout/homogeneous_layout/homogeneous_layout.py -------------------------------------------------------------------------------- /simulator/initial_layout/ilp_layout/ilp_layout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/initial_layout/ilp_layout/ilp_layout.py -------------------------------------------------------------------------------- /simulator/initial_layout/layout_synthesizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/initial_layout/layout_synthesizer.py -------------------------------------------------------------------------------- /simulator/initial_layout/load_existing_layout.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/initial_layout/load_existing_layout.py -------------------------------------------------------------------------------- /simulator/model_manager/base_classes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/base_classes.py -------------------------------------------------------------------------------- /simulator/model_manager/example_large/example_large.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/example_large/example_large.py -------------------------------------------------------------------------------- /simulator/model_manager/example_large/example_large_a100.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/example_large/example_large_a100.py -------------------------------------------------------------------------------- /simulator/model_manager/example_large/example_large_h100.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/example_large/example_large_h100.py -------------------------------------------------------------------------------- /simulator/model_manager/example_large/example_large_t4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/example_large/example_large_t4.py -------------------------------------------------------------------------------- /simulator/model_manager/example_small/example_small.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/example_small/example_small.py -------------------------------------------------------------------------------- /simulator/model_manager/example_small/example_small_a100.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/example_small/example_small_a100.py -------------------------------------------------------------------------------- /simulator/model_manager/example_small/example_small_t4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/example_small/example_small_t4.py -------------------------------------------------------------------------------- /simulator/model_manager/google_machine_profiles.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/google_machine_profiles.ini -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/a100/decode_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/a100/decode_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/a100/llama1_30b_a100.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/a100/llama1_30b_a100.py -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/a100/prompt_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/a100/prompt_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/helper.py -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/l4/decode_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/l4/decode_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/l4/llama1_30b_l4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/l4/llama1_30b_l4.py -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/l4/prompt_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/l4/prompt_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/l4x2/decode_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/l4x2/decode_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/l4x2/llama1_30b_l4x2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/l4x2/llama1_30b_l4x2.py -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/l4x2/prompt_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/l4x2/prompt_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/llama1_30b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/llama1_30b.py -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/t4/decode_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/t4/decode_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/t4/llama1_30b_t4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/t4/llama1_30b_t4.py -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/t4/prompt_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/t4/prompt_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/t4x2/decode_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/t4x2/decode_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/t4x2/llama1_30b_t4x2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/t4x2/llama1_30b_t4x2.py -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/t4x2/prompt_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/t4x2/prompt_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/t4x4/decode_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/t4x4/decode_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/t4x4/llama1_30b_t4x4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/t4x4/llama1_30b_t4x4.py -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/t4x4/prompt_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/t4x4/prompt_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/v100/decode_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/v100/decode_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/v100/llama1_30b_v100.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/v100/llama1_30b_v100.py -------------------------------------------------------------------------------- /simulator/model_manager/llama1_30b/v100/prompt_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama1_30b/v100/prompt_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/a100/decode_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/a100/decode_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/a100/llama2_70b_a100.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/a100/llama2_70b_a100.py -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/a100/prompt_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/a100/prompt_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/helper.py -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/l4/decode_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/l4/decode_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/l4/llama2_70b_l4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/l4/llama2_70b_l4.py -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/l4/prompt_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/l4/prompt_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/l4x2/decode_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/l4x2/decode_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/l4x2/llama2_70b_l4x2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/l4x2/llama2_70b_l4x2.py -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/l4x2/prompt_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/l4x2/prompt_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/llama2_70b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/llama2_70b.py -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/t4/decode_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/t4/decode_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/t4/llama2_70b_t4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/t4/llama2_70b_t4.py -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/t4/prompt_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/t4/prompt_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/t4x2/decode_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/t4x2/decode_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/t4x2/llama2_70b_t4x2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/t4x2/llama2_70b_t4x2.py -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/t4x2/prompt_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/t4x2/prompt_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/t4x4/decode_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/t4x4/decode_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/t4x4/llama2_70b_t4x4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/t4x4/llama2_70b_t4x4.py -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/t4x4/prompt_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/t4x4/prompt_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/v100/decode_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/v100/decode_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/v100/llama2_70b_v100.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/v100/llama2_70b_v100.py -------------------------------------------------------------------------------- /simulator/model_manager/llama2_70b/v100/prompt_bs2time.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/llama2_70b/v100/prompt_bs2time.csv -------------------------------------------------------------------------------- /simulator/model_manager/model_manager.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/model_manager.py -------------------------------------------------------------------------------- /simulator/model_manager/template_machine_on_node.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/model_manager/template_machine_on_node.py -------------------------------------------------------------------------------- /simulator/scheduler/base_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/scheduler/base_scheduler.py -------------------------------------------------------------------------------- /simulator/scheduler/execution_policy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/scheduler/execution_policy.py -------------------------------------------------------------------------------- /simulator/scheduler/global_maxflow/global_maxflow_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/scheduler/global_maxflow/global_maxflow_scheduler.py -------------------------------------------------------------------------------- /simulator/scheduler/global_maxflow/interleaved_weighted_round_robin.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/scheduler/global_maxflow/interleaved_weighted_round_robin.py -------------------------------------------------------------------------------- /simulator/scheduler/global_maxflow/kv_expectation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/scheduler/global_maxflow/kv_expectation.py -------------------------------------------------------------------------------- /simulator/scheduler/global_maxflow/network_flow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/scheduler/global_maxflow/network_flow.py -------------------------------------------------------------------------------- /simulator/scheduler/global_maxflow/scheduler_core.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/scheduler/global_maxflow/scheduler_core.py -------------------------------------------------------------------------------- /simulator/scheduler/local_maxflow/maxflow_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/scheduler/local_maxflow/maxflow_scheduler.py -------------------------------------------------------------------------------- /simulator/scheduler/local_maxflow/maxflow_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/scheduler/local_maxflow/maxflow_utils.py -------------------------------------------------------------------------------- /simulator/scheduler/naive_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/scheduler/naive_scheduler.py -------------------------------------------------------------------------------- /simulator/scheduler/shortest_queue/shortest_queue_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/scheduler/shortest_queue/shortest_queue_scheduler.py -------------------------------------------------------------------------------- /simulator/scheduler/swarm/swarm_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/scheduler/swarm/swarm_scheduler.py -------------------------------------------------------------------------------- /simulator/trace_generator/arrival_rate/azure_code_arrive_time.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/trace_generator/arrival_rate/azure_code_arrive_time.pkl -------------------------------------------------------------------------------- /simulator/trace_generator/arrival_rate/azure_conv_arrive_time.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/trace_generator/arrival_rate/azure_conv_arrive_time.pkl -------------------------------------------------------------------------------- /simulator/trace_generator/arrival_rate_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/trace_generator/arrival_rate_sampler.py -------------------------------------------------------------------------------- /simulator/trace_generator/length_data/alpaca_input.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/trace_generator/length_data/alpaca_input.pkl -------------------------------------------------------------------------------- /simulator/trace_generator/length_data/alpaca_output.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/trace_generator/length_data/alpaca_output.pkl -------------------------------------------------------------------------------- /simulator/trace_generator/length_data/azure_code_input.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/trace_generator/length_data/azure_code_input.pkl -------------------------------------------------------------------------------- /simulator/trace_generator/length_data/azure_code_output.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/trace_generator/length_data/azure_code_output.pkl -------------------------------------------------------------------------------- /simulator/trace_generator/length_data/azure_conv_input.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/trace_generator/length_data/azure_conv_input.pkl -------------------------------------------------------------------------------- /simulator/trace_generator/length_data/azure_conv_output.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/trace_generator/length_data/azure_conv_output.pkl -------------------------------------------------------------------------------- /simulator/trace_generator/length_data/shared_gpt_input.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/trace_generator/length_data/shared_gpt_input.pkl -------------------------------------------------------------------------------- /simulator/trace_generator/length_data/shared_gpt_output.pkl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/trace_generator/length_data/shared_gpt_output.pkl -------------------------------------------------------------------------------- /simulator/trace_generator/length_sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/trace_generator/length_sampler.py -------------------------------------------------------------------------------- /simulator/trace_generator/simulator_query_feeder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/trace_generator/simulator_query_feeder.py -------------------------------------------------------------------------------- /simulator/trace_generator/trace_generator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Thesys-lab/Helix-ASPLOS25/HEAD/simulator/trace_generator/trace_generator.py --------------------------------------------------------------------------------