├── .gitignore ├── Data ├── Ruler │ ├── prepare.py │ ├── synthetic.yaml │ ├── synthetic │ │ ├── common_words_extraction.py │ │ ├── constants.py │ │ ├── freq_words_extraction.py │ │ ├── json │ │ │ ├── PaulGrahamEssays.json │ │ │ ├── PaulGrahamEssays_URLs.txt │ │ │ ├── download_paulgraham_essay.py │ │ │ ├── download_qa_dataset.sh │ │ │ ├── hotpotqa.json │ │ │ └── squad.json │ │ ├── niah.py │ │ ├── qa.py │ │ └── variable_tracking.py │ ├── template.py │ └── tokenizer.py ├── __init__.py ├── c4_small.json ├── data_converter.py └── pg19 │ ├── pg19-test.json │ └── pg19-train.json ├── Engine ├── SnapKV │ ├── __init__.py │ ├── backend.py │ ├── backend_draft.py │ ├── model.py │ └── model_draft.py ├── StreamingLLM │ ├── __init__.py │ ├── backend.py │ ├── backend_draft.py │ ├── model.py │ └── model_draft.py ├── __init__.py ├── quantize.py ├── tp.py └── utils.py ├── LICENSE ├── README.md ├── convert_hf_checkpoint.py ├── download.py ├── index.html ├── notes.txt ├── pages ├── index.html └── static │ ├── Triforce.ttf │ ├── css │ ├── bulma-carousel.min.css │ ├── bulma-slider.min.css │ ├── bulma.css.map.txt │ ├── bulma.min.css │ ├── fontawesome.all.min.css │ └── index.css │ ├── images │ ├── TriForce.gif │ ├── Verification.png │ ├── arithmetic_intensity.png │ ├── draft_2_target.png │ ├── draft_to_target_llama2.png │ ├── draft_to_target_llama3.png │ ├── draft_to_target_mem_ratio_llama2.png │ ├── draft_to_target_mem_ratio_llama3.png │ ├── frac_fwd_pass.png │ ├── icons │ │ ├── Drafting.png │ │ ├── Fast.png │ │ ├── GPU.png │ │ ├── Idea.png │ │ ├── Llama.png │ │ ├── MagicDec.png │ │ ├── Magic_wand_icon.png │ │ ├── MathematicsCompass.png │ │ ├── Observation.png │ │ ├── Stonks_emoji.png │ │ ├── Switch.png │ │ ├── Telescope.png │ │ ├── choice_of_eggs.png │ │ ├── deep-dive.png │ │ ├── demo.png │ │ ├── experiments.png │ │ ├── experiments.svg │ │ ├── math.svg │ │ ├── revisit.png │ │ ├── revisit.svg │ │ ├── sequoia.png │ │ ├── specdec.png │ │ └── timepassing.png │ ├── kvloadtime.png │ ├── speedups_budget512.png │ ├── ver_2_reg_llama2.png │ ├── ver_2_reg_llama3.png │ └── verify_2_autoreg.png │ ├── js │ ├── bulma-carousel.js │ ├── bulma-carousel.min.js │ ├── bulma-slider.js │ ├── bulma-slider.min.js │ ├── fontawesome.all.min.js │ ├── index.js │ └── plots │ │ ├── throughput_latency.js │ │ └── throughput_latency_smaller.js │ ├── pdfs │ └── sample.pdf │ └── videos │ └── TriForce.mp4 ├── requirements.txt ├── static ├── Triforce.ttf ├── css │ ├── bulma-carousel.min.css │ ├── bulma-slider.min.css │ ├── bulma.css.map.txt │ ├── bulma.min.css │ ├── fontawesome.all.min.css │ └── index.css ├── images │ ├── TriForce.gif │ ├── Verification.png │ ├── arithmetic_intensity.png │ ├── draft_to_target_llama2.png │ ├── draft_to_target_llama3.png │ ├── draft_to_target_mem_ratio_llama2.png │ ├── draft_to_target_mem_ratio_llama3.png │ ├── icons │ │ ├── Drafting.png │ │ ├── Fast.png │ │ ├── GPU.png │ │ ├── Idea.png │ │ ├── Llama.png │ │ ├── MagicDec.png │ │ ├── Magic_wand_icon.png │ │ ├── MathematicsCompass.png │ │ ├── Observation.png │ │ ├── Stonks_emoji.png │ │ ├── Switch.png │ │ ├── Telescope.png │ │ ├── choice_of_eggs.png │ │ ├── demo.png │ │ ├── experiments.png │ │ ├── experiments.svg │ │ ├── math.svg │ │ ├── revisit.png │ │ ├── revisit.svg │ │ └── timepassing.png │ ├── kvloadtime.png │ ├── speedups_budget512.png │ ├── ver_2_reg_llama2.png │ └── ver_2_reg_llama3.png ├── js │ ├── bulma-carousel.js │ ├── bulma-carousel.min.js │ ├── bulma-slider.js │ ├── bulma-slider.min.js │ ├── fontawesome.all.min.js │ ├── index.js │ └── plots │ │ ├── throughput_latency.js │ │ └── throughput_latency_smaller.js ├── pdfs │ └── sample.pdf └── videos │ └── TriForce.mp4 ├── test.html └── tests ├── SnapKV ├── longspec_benchmark.py └── selfspec_benchmark.py ├── StreamingLLM ├── longspec_benchmark.py └── selfspec_benchmark.py └── baseline_benchmark.py /.gitignore: -------------------------------------------------------------------------------- 1 | **/__pycache__ 2 | **/*.pyc 3 | .DS_Store 4 | -------------------------------------------------------------------------------- /Data/Ruler/prepare.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/Ruler/prepare.py -------------------------------------------------------------------------------- /Data/Ruler/synthetic.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/Ruler/synthetic.yaml -------------------------------------------------------------------------------- /Data/Ruler/synthetic/common_words_extraction.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/Ruler/synthetic/common_words_extraction.py -------------------------------------------------------------------------------- /Data/Ruler/synthetic/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/Ruler/synthetic/constants.py -------------------------------------------------------------------------------- /Data/Ruler/synthetic/freq_words_extraction.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/Ruler/synthetic/freq_words_extraction.py -------------------------------------------------------------------------------- /Data/Ruler/synthetic/json/PaulGrahamEssays.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/Ruler/synthetic/json/PaulGrahamEssays.json -------------------------------------------------------------------------------- /Data/Ruler/synthetic/json/PaulGrahamEssays_URLs.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/Ruler/synthetic/json/PaulGrahamEssays_URLs.txt -------------------------------------------------------------------------------- /Data/Ruler/synthetic/json/download_paulgraham_essay.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/Ruler/synthetic/json/download_paulgraham_essay.py -------------------------------------------------------------------------------- /Data/Ruler/synthetic/json/download_qa_dataset.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/Ruler/synthetic/json/download_qa_dataset.sh -------------------------------------------------------------------------------- /Data/Ruler/synthetic/json/hotpotqa.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/Ruler/synthetic/json/hotpotqa.json -------------------------------------------------------------------------------- /Data/Ruler/synthetic/json/squad.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/Ruler/synthetic/json/squad.json -------------------------------------------------------------------------------- /Data/Ruler/synthetic/niah.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/Ruler/synthetic/niah.py -------------------------------------------------------------------------------- /Data/Ruler/synthetic/qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/Ruler/synthetic/qa.py -------------------------------------------------------------------------------- /Data/Ruler/synthetic/variable_tracking.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/Ruler/synthetic/variable_tracking.py -------------------------------------------------------------------------------- /Data/Ruler/template.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/Ruler/template.py -------------------------------------------------------------------------------- /Data/Ruler/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/Ruler/tokenizer.py -------------------------------------------------------------------------------- /Data/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /Data/c4_small.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/c4_small.json -------------------------------------------------------------------------------- /Data/data_converter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/data_converter.py -------------------------------------------------------------------------------- /Data/pg19/pg19-test.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/pg19/pg19-test.json -------------------------------------------------------------------------------- /Data/pg19/pg19-train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Data/pg19/pg19-train.json -------------------------------------------------------------------------------- /Engine/SnapKV/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /Engine/SnapKV/backend.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Engine/SnapKV/backend.py -------------------------------------------------------------------------------- /Engine/SnapKV/backend_draft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Engine/SnapKV/backend_draft.py -------------------------------------------------------------------------------- /Engine/SnapKV/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Engine/SnapKV/model.py -------------------------------------------------------------------------------- /Engine/SnapKV/model_draft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Engine/SnapKV/model_draft.py -------------------------------------------------------------------------------- /Engine/StreamingLLM/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /Engine/StreamingLLM/backend.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Engine/StreamingLLM/backend.py -------------------------------------------------------------------------------- /Engine/StreamingLLM/backend_draft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Engine/StreamingLLM/backend_draft.py -------------------------------------------------------------------------------- /Engine/StreamingLLM/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Engine/StreamingLLM/model.py -------------------------------------------------------------------------------- /Engine/StreamingLLM/model_draft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Engine/StreamingLLM/model_draft.py -------------------------------------------------------------------------------- /Engine/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /Engine/quantize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Engine/quantize.py -------------------------------------------------------------------------------- /Engine/tp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Engine/tp.py -------------------------------------------------------------------------------- /Engine/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/Engine/utils.py -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/README.md -------------------------------------------------------------------------------- /convert_hf_checkpoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/convert_hf_checkpoint.py -------------------------------------------------------------------------------- /download.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/download.py -------------------------------------------------------------------------------- /index.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/index.html -------------------------------------------------------------------------------- /notes.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/notes.txt -------------------------------------------------------------------------------- /pages/index.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/index.html -------------------------------------------------------------------------------- /pages/static/Triforce.ttf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/Triforce.ttf -------------------------------------------------------------------------------- /pages/static/css/bulma-carousel.min.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/css/bulma-carousel.min.css -------------------------------------------------------------------------------- /pages/static/css/bulma-slider.min.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/css/bulma-slider.min.css -------------------------------------------------------------------------------- /pages/static/css/bulma.css.map.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/css/bulma.css.map.txt -------------------------------------------------------------------------------- /pages/static/css/bulma.min.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/css/bulma.min.css -------------------------------------------------------------------------------- /pages/static/css/fontawesome.all.min.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/css/fontawesome.all.min.css -------------------------------------------------------------------------------- /pages/static/css/index.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/css/index.css -------------------------------------------------------------------------------- /pages/static/images/TriForce.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/TriForce.gif -------------------------------------------------------------------------------- /pages/static/images/Verification.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/Verification.png -------------------------------------------------------------------------------- /pages/static/images/arithmetic_intensity.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/arithmetic_intensity.png -------------------------------------------------------------------------------- /pages/static/images/draft_2_target.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/draft_2_target.png -------------------------------------------------------------------------------- /pages/static/images/draft_to_target_llama2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/draft_to_target_llama2.png -------------------------------------------------------------------------------- /pages/static/images/draft_to_target_llama3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/draft_to_target_llama3.png -------------------------------------------------------------------------------- /pages/static/images/draft_to_target_mem_ratio_llama2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/draft_to_target_mem_ratio_llama2.png -------------------------------------------------------------------------------- /pages/static/images/draft_to_target_mem_ratio_llama3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/draft_to_target_mem_ratio_llama3.png -------------------------------------------------------------------------------- /pages/static/images/frac_fwd_pass.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/frac_fwd_pass.png -------------------------------------------------------------------------------- /pages/static/images/icons/Drafting.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/Drafting.png -------------------------------------------------------------------------------- /pages/static/images/icons/Fast.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/Fast.png -------------------------------------------------------------------------------- /pages/static/images/icons/GPU.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/GPU.png -------------------------------------------------------------------------------- /pages/static/images/icons/Idea.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/Idea.png -------------------------------------------------------------------------------- /pages/static/images/icons/Llama.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/Llama.png -------------------------------------------------------------------------------- /pages/static/images/icons/MagicDec.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/MagicDec.png -------------------------------------------------------------------------------- /pages/static/images/icons/Magic_wand_icon.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/Magic_wand_icon.png -------------------------------------------------------------------------------- /pages/static/images/icons/MathematicsCompass.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/MathematicsCompass.png -------------------------------------------------------------------------------- /pages/static/images/icons/Observation.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/Observation.png -------------------------------------------------------------------------------- /pages/static/images/icons/Stonks_emoji.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/Stonks_emoji.png -------------------------------------------------------------------------------- /pages/static/images/icons/Switch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/Switch.png -------------------------------------------------------------------------------- /pages/static/images/icons/Telescope.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/Telescope.png -------------------------------------------------------------------------------- /pages/static/images/icons/choice_of_eggs.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/choice_of_eggs.png -------------------------------------------------------------------------------- /pages/static/images/icons/deep-dive.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/deep-dive.png -------------------------------------------------------------------------------- /pages/static/images/icons/demo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/demo.png -------------------------------------------------------------------------------- /pages/static/images/icons/experiments.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/experiments.png -------------------------------------------------------------------------------- /pages/static/images/icons/experiments.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/experiments.svg -------------------------------------------------------------------------------- /pages/static/images/icons/math.svg: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /pages/static/images/icons/revisit.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/revisit.png -------------------------------------------------------------------------------- /pages/static/images/icons/revisit.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/revisit.svg -------------------------------------------------------------------------------- /pages/static/images/icons/sequoia.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/sequoia.png -------------------------------------------------------------------------------- /pages/static/images/icons/specdec.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/specdec.png -------------------------------------------------------------------------------- /pages/static/images/icons/timepassing.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/icons/timepassing.png -------------------------------------------------------------------------------- /pages/static/images/kvloadtime.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/kvloadtime.png -------------------------------------------------------------------------------- /pages/static/images/speedups_budget512.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/speedups_budget512.png -------------------------------------------------------------------------------- /pages/static/images/ver_2_reg_llama2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/ver_2_reg_llama2.png -------------------------------------------------------------------------------- /pages/static/images/ver_2_reg_llama3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/ver_2_reg_llama3.png -------------------------------------------------------------------------------- /pages/static/images/verify_2_autoreg.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/images/verify_2_autoreg.png -------------------------------------------------------------------------------- /pages/static/js/bulma-carousel.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/js/bulma-carousel.js -------------------------------------------------------------------------------- /pages/static/js/bulma-carousel.min.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/js/bulma-carousel.min.js -------------------------------------------------------------------------------- /pages/static/js/bulma-slider.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/js/bulma-slider.js -------------------------------------------------------------------------------- /pages/static/js/bulma-slider.min.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/js/bulma-slider.min.js -------------------------------------------------------------------------------- /pages/static/js/fontawesome.all.min.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/js/fontawesome.all.min.js -------------------------------------------------------------------------------- /pages/static/js/index.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/js/index.js -------------------------------------------------------------------------------- /pages/static/js/plots/throughput_latency.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/js/plots/throughput_latency.js -------------------------------------------------------------------------------- /pages/static/js/plots/throughput_latency_smaller.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/js/plots/throughput_latency_smaller.js -------------------------------------------------------------------------------- /pages/static/pdfs/sample.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/pdfs/sample.pdf -------------------------------------------------------------------------------- /pages/static/videos/TriForce.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/pages/static/videos/TriForce.mp4 -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/requirements.txt -------------------------------------------------------------------------------- /static/Triforce.ttf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/Triforce.ttf -------------------------------------------------------------------------------- /static/css/bulma-carousel.min.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/css/bulma-carousel.min.css -------------------------------------------------------------------------------- /static/css/bulma-slider.min.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/css/bulma-slider.min.css -------------------------------------------------------------------------------- /static/css/bulma.css.map.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/css/bulma.css.map.txt -------------------------------------------------------------------------------- /static/css/bulma.min.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/css/bulma.min.css -------------------------------------------------------------------------------- /static/css/fontawesome.all.min.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/css/fontawesome.all.min.css -------------------------------------------------------------------------------- /static/css/index.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/css/index.css -------------------------------------------------------------------------------- /static/images/TriForce.gif: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/TriForce.gif -------------------------------------------------------------------------------- /static/images/Verification.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/Verification.png -------------------------------------------------------------------------------- /static/images/arithmetic_intensity.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/arithmetic_intensity.png -------------------------------------------------------------------------------- /static/images/draft_to_target_llama2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/draft_to_target_llama2.png -------------------------------------------------------------------------------- /static/images/draft_to_target_llama3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/draft_to_target_llama3.png -------------------------------------------------------------------------------- /static/images/draft_to_target_mem_ratio_llama2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/draft_to_target_mem_ratio_llama2.png -------------------------------------------------------------------------------- /static/images/draft_to_target_mem_ratio_llama3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/draft_to_target_mem_ratio_llama3.png -------------------------------------------------------------------------------- /static/images/icons/Drafting.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/Drafting.png -------------------------------------------------------------------------------- /static/images/icons/Fast.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/Fast.png -------------------------------------------------------------------------------- /static/images/icons/GPU.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/GPU.png -------------------------------------------------------------------------------- /static/images/icons/Idea.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/Idea.png -------------------------------------------------------------------------------- /static/images/icons/Llama.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/Llama.png -------------------------------------------------------------------------------- /static/images/icons/MagicDec.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/MagicDec.png -------------------------------------------------------------------------------- /static/images/icons/Magic_wand_icon.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/Magic_wand_icon.png -------------------------------------------------------------------------------- /static/images/icons/MathematicsCompass.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/MathematicsCompass.png -------------------------------------------------------------------------------- /static/images/icons/Observation.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/Observation.png -------------------------------------------------------------------------------- /static/images/icons/Stonks_emoji.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/Stonks_emoji.png -------------------------------------------------------------------------------- /static/images/icons/Switch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/Switch.png -------------------------------------------------------------------------------- /static/images/icons/Telescope.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/Telescope.png -------------------------------------------------------------------------------- /static/images/icons/choice_of_eggs.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/choice_of_eggs.png -------------------------------------------------------------------------------- /static/images/icons/demo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/demo.png -------------------------------------------------------------------------------- /static/images/icons/experiments.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/experiments.png -------------------------------------------------------------------------------- /static/images/icons/experiments.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/experiments.svg -------------------------------------------------------------------------------- /static/images/icons/math.svg: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /static/images/icons/revisit.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/revisit.png -------------------------------------------------------------------------------- /static/images/icons/revisit.svg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/revisit.svg -------------------------------------------------------------------------------- /static/images/icons/timepassing.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/icons/timepassing.png -------------------------------------------------------------------------------- /static/images/kvloadtime.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/kvloadtime.png -------------------------------------------------------------------------------- /static/images/speedups_budget512.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/speedups_budget512.png -------------------------------------------------------------------------------- /static/images/ver_2_reg_llama2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/ver_2_reg_llama2.png -------------------------------------------------------------------------------- /static/images/ver_2_reg_llama3.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/images/ver_2_reg_llama3.png -------------------------------------------------------------------------------- /static/js/bulma-carousel.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/js/bulma-carousel.js -------------------------------------------------------------------------------- /static/js/bulma-carousel.min.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/js/bulma-carousel.min.js -------------------------------------------------------------------------------- /static/js/bulma-slider.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/js/bulma-slider.js -------------------------------------------------------------------------------- /static/js/bulma-slider.min.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/js/bulma-slider.min.js -------------------------------------------------------------------------------- /static/js/fontawesome.all.min.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/js/fontawesome.all.min.js -------------------------------------------------------------------------------- /static/js/index.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/js/index.js -------------------------------------------------------------------------------- /static/js/plots/throughput_latency.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/js/plots/throughput_latency.js -------------------------------------------------------------------------------- /static/js/plots/throughput_latency_smaller.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/js/plots/throughput_latency_smaller.js -------------------------------------------------------------------------------- /static/pdfs/sample.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/pdfs/sample.pdf -------------------------------------------------------------------------------- /static/videos/TriForce.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/static/videos/TriForce.mp4 -------------------------------------------------------------------------------- /test.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/test.html -------------------------------------------------------------------------------- /tests/SnapKV/longspec_benchmark.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/tests/SnapKV/longspec_benchmark.py -------------------------------------------------------------------------------- /tests/SnapKV/selfspec_benchmark.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/tests/SnapKV/selfspec_benchmark.py -------------------------------------------------------------------------------- /tests/StreamingLLM/longspec_benchmark.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/tests/StreamingLLM/longspec_benchmark.py -------------------------------------------------------------------------------- /tests/StreamingLLM/selfspec_benchmark.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/tests/StreamingLLM/selfspec_benchmark.py -------------------------------------------------------------------------------- /tests/baseline_benchmark.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Infini-AI-Lab/MagicDec/HEAD/tests/baseline_benchmark.py --------------------------------------------------------------------------------