├── .gitignore ├── README.md ├── TokenButler_Draft.pdf ├── ablation_results ├── ablation_analysis.py ├── ablation_plots │ ├── Qwen_Qwen2.5-0.5B_decode_jsd_per_layer.pdf │ ├── Qwen_Qwen2.5-0.5B_decode_percdrift_per_layer.pdf │ ├── Qwen_Qwen2.5-0.5B_drift_density_heatmap.png │ ├── Qwen_Qwen2.5-0.5B_drift_trajectory.png │ ├── Qwen_Qwen2.5-0.5B_head_agreement_js_divergence.pdf │ ├── Qwen_Qwen2.5-0.5B_headtok_consistency_js_divergence.pdf │ ├── Qwen_Qwen2.5-0.5B_rank_agreement_violin.pdf │ ├── Qwen_Qwen2.5-0.5B_rankcorr_heatmap.png │ ├── Qwen_Qwen2.5-1.5B_decode_jsd_per_layer.pdf │ ├── Qwen_Qwen2.5-1.5B_decode_percdrift_per_layer.pdf │ ├── Qwen_Qwen2.5-1.5B_drift_density_heatmap.png │ ├── Qwen_Qwen2.5-1.5B_drift_trajectory.png │ ├── Qwen_Qwen2.5-1.5B_head_agreement_js_divergence.pdf │ ├── Qwen_Qwen2.5-1.5B_headtok_consistency_js_divergence.pdf │ ├── Qwen_Qwen2.5-1.5B_rank_agreement_violin.pdf │ ├── Qwen_Qwen2.5-1.5B_rankcorr_heatmap.png │ ├── Qwen_Qwen2.5-14B_decode_jsd_per_layer.pdf │ ├── Qwen_Qwen2.5-14B_decode_percdrift_per_layer.pdf │ ├── Qwen_Qwen2.5-14B_drift_density_heatmap.png │ ├── Qwen_Qwen2.5-14B_drift_trajectory.png │ ├── Qwen_Qwen2.5-14B_head_agreement_js_divergence.pdf │ ├── Qwen_Qwen2.5-14B_headtok_consistency_js_divergence.pdf │ ├── Qwen_Qwen2.5-14B_rank_agreement_violin.pdf │ ├── Qwen_Qwen2.5-3B_decode_jsd_per_layer.pdf │ ├── Qwen_Qwen2.5-3B_decode_percdrift_per_layer.pdf │ ├── Qwen_Qwen2.5-3B_drift_density_heatmap.png │ ├── Qwen_Qwen2.5-3B_drift_trajectory.png │ ├── Qwen_Qwen2.5-3B_head_agreement_js_divergence.pdf │ ├── Qwen_Qwen2.5-3B_headtok_consistency_js_divergence.pdf │ ├── Qwen_Qwen2.5-3B_rank_agreement_violin.pdf │ ├── Qwen_Qwen2.5-3B_rankcorr_heatmap.png │ ├── Qwen_Qwen2.5-7B_decode_jsd_per_layer.pdf │ ├── Qwen_Qwen2.5-7B_decode_percdrift_per_layer.pdf │ ├── Qwen_Qwen2.5-7B_drift_density_heatmap.png │ ├── Qwen_Qwen2.5-7B_drift_trajectory.png │ ├── Qwen_Qwen2.5-7B_head_agreement_js_divergence.pdf │ ├── Qwen_Qwen2.5-7B_headtok_consistency_js_divergence.pdf │ ├── Qwen_Qwen2.5-7B_rank_agreement_violin.pdf │ ├── Qwen_Qwen2.5-7B_rankcorr_heatmap.png │ ├── meta-llama_Llama-2-13b-hf_decode_jsd_per_layer.pdf │ ├── meta-llama_Llama-2-13b-hf_decode_percdrift_per_layer.pdf │ ├── meta-llama_Llama-2-13b-hf_drift_density_heatmap.png │ ├── meta-llama_Llama-2-13b-hf_drift_trajectory.png │ ├── meta-llama_Llama-2-13b-hf_head_agreement_js_divergence.pdf │ ├── meta-llama_Llama-2-13b-hf_headtok_consistency_js_divergence.pdf │ ├── meta-llama_Llama-2-13b-hf_rank_agreement_violin.pdf │ ├── meta-llama_Llama-2-7b-hf_decode_jsd_per_layer.pdf │ ├── meta-llama_Llama-2-7b-hf_decode_percdrift_per_layer.pdf │ ├── meta-llama_Llama-2-7b-hf_drift_density_heatmap.png │ ├── meta-llama_Llama-2-7b-hf_drift_trajectory.png │ ├── meta-llama_Llama-2-7b-hf_head_agreement_js_divergence.pdf │ ├── meta-llama_Llama-2-7b-hf_headtok_consistency_js_divergence.pdf │ ├── meta-llama_Llama-2-7b-hf_rank_agreement_violin.pdf │ ├── meta-llama_Llama-3.1-8B_decode_jsd_per_layer.pdf │ ├── meta-llama_Llama-3.1-8B_decode_percdrift_per_layer.pdf │ ├── meta-llama_Llama-3.1-8B_drift_density_heatmap.png │ ├── meta-llama_Llama-3.1-8B_drift_trajectory.png │ ├── meta-llama_Llama-3.1-8B_head_agreement_js_divergence.pdf │ ├── meta-llama_Llama-3.1-8B_headtok_consistency_js_divergence.pdf │ ├── meta-llama_Llama-3.1-8B_rank_agreement_violin.pdf │ ├── meta-llama_Llama-3.2-1B_decode_jsd_per_layer.pdf │ ├── meta-llama_Llama-3.2-1B_decode_percdrift_per_layer.pdf │ ├── meta-llama_Llama-3.2-1B_drift_density_heatmap.png │ ├── meta-llama_Llama-3.2-1B_drift_trajectory.png │ ├── meta-llama_Llama-3.2-1B_head_agreement_js_divergence.pdf │ ├── meta-llama_Llama-3.2-1B_headtok_consistency_js_divergence.pdf │ ├── meta-llama_Llama-3.2-1B_rank_agreement_violin.pdf │ ├── meta-llama_Llama-3.2-1B_rankcorr_heatmap.png │ ├── meta-llama_Llama-3.2-3B_decode_jsd_per_layer.pdf │ ├── meta-llama_Llama-3.2-3B_decode_percdrift_per_layer.pdf │ ├── meta-llama_Llama-3.2-3B_drift_density_heatmap.png │ ├── meta-llama_Llama-3.2-3B_drift_trajectory.png │ ├── meta-llama_Llama-3.2-3B_head_agreement_js_divergence.pdf │ ├── meta-llama_Llama-3.2-3B_headtok_consistency_js_divergence.pdf │ ├── meta-llama_Llama-3.2-3B_rank_agreement_violin.pdf │ ├── meta-llama_Llama-3.2-3B_rankcorr_heatmap.png │ ├── microsoft_Phi-3-medium-4k-instruct_decode_jsd_per_layer.pdf │ ├── microsoft_Phi-3-medium-4k-instruct_decode_percdrift_per_layer.pdf │ ├── microsoft_Phi-3-medium-4k-instruct_drift_density_heatmap.png │ ├── microsoft_Phi-3-medium-4k-instruct_drift_trajectory.png │ ├── microsoft_Phi-3-medium-4k-instruct_head_agreement_js_divergence.pdf │ ├── microsoft_Phi-3-medium-4k-instruct_headtok_consistency_js_divergence.pdf │ ├── microsoft_Phi-3-medium-4k-instruct_rank_agreement_violin.pdf │ ├── microsoft_Phi-3-mini-4k-instruct_decode_jsd_per_layer.pdf │ ├── microsoft_Phi-3-mini-4k-instruct_decode_percdrift_per_layer.pdf │ ├── microsoft_Phi-3-mini-4k-instruct_drift_density_heatmap.png │ ├── microsoft_Phi-3-mini-4k-instruct_drift_trajectory.png │ ├── microsoft_Phi-3-mini-4k-instruct_head_agreement_js_divergence.pdf │ ├── microsoft_Phi-3-mini-4k-instruct_headtok_consistency_js_divergence.pdf │ ├── microsoft_Phi-3-mini-4k-instruct_rank_agreement_violin.pdf │ ├── microsoft_Phi-3.5-mini-instruct_decode_jsd_per_layer.pdf │ ├── microsoft_Phi-3.5-mini-instruct_decode_percdrift_per_layer.pdf │ ├── microsoft_Phi-3.5-mini-instruct_drift_density_heatmap.png │ ├── microsoft_Phi-3.5-mini-instruct_drift_trajectory.png │ ├── microsoft_Phi-3.5-mini-instruct_head_agreement_js_divergence.pdf │ ├── microsoft_Phi-3.5-mini-instruct_headtok_consistency_js_divergence.pdf │ ├── microsoft_Phi-3.5-mini-instruct_rank_agreement_violin.pdf │ ├── microsoft_phi-4_decode_jsd_per_layer.pdf │ ├── microsoft_phi-4_decode_percdrift_per_layer.pdf │ ├── microsoft_phi-4_head_agreement_js_divergence.pdf │ ├── microsoft_phi-4_headtok_consistency_js_divergence.pdf │ ├── mistralai_Mistral-7B-v0.1_decode_jsd_per_layer.pdf │ ├── mistralai_Mistral-7B-v0.1_decode_percdrift_per_layer.pdf │ ├── mistralai_Mistral-7B-v0.1_drift_density_heatmap.png │ ├── mistralai_Mistral-7B-v0.1_drift_trajectory.png │ ├── mistralai_Mistral-7B-v0.1_head_agreement_js_divergence.pdf │ ├── mistralai_Mistral-7B-v0.1_headtok_consistency_js_divergence.pdf │ ├── mistralai_Mistral-7B-v0.1_rank_agreement_violin.pdf │ └── traces │ │ ├── decode_drift_trajectory │ │ ├── combined_drift_plots.pdf │ │ ├── drift_traj_Qwen_Qwen2.5-0.5B.npy │ │ ├── drift_traj_Qwen_Qwen2.5-14B.npy │ │ ├── drift_traj_Qwen_Qwen2.5-3B.npy │ │ ├── drift_traj_Qwen_Qwen2.5-7B.npy │ │ ├── drift_traj_meta-llama_Llama-2-13b-hf.npy │ │ ├── drift_traj_meta-llama_Llama-2-7b-hf.npy │ │ ├── drift_traj_meta-llama_Llama-3.1-8B.npy │ │ ├── drift_traj_meta-llama_Llama-3.2-1B.npy │ │ ├── drift_traj_meta-llama_Llama-3.2-3B.npy │ │ ├── drift_traj_microsoft_Phi-3-medium-4k-instruct.npy │ │ ├── drift_traj_microsoft_Phi-3-mini-4k-instruct.npy │ │ ├── drift_traj_microsoft_Phi-3.5-mini-instruct.npy │ │ ├── drift_traj_mistralai_Mistral-7B-v0.1.npy │ │ └── drift_trajectories_subplots.pdf │ │ ├── decode_jsd │ │ ├── decode_jsd_Qwen_Qwen2.5-0.5B.npy │ │ ├── decode_jsd_Qwen_Qwen2.5-1.5B.npy │ │ ├── decode_jsd_Qwen_Qwen2.5-14B.npy │ │ ├── decode_jsd_Qwen_Qwen2.5-3B.npy │ │ ├── decode_jsd_Qwen_Qwen2.5-7B.npy │ │ ├── decode_jsd_meta-llama_Llama-2-13b-hf.npy │ │ ├── decode_jsd_meta-llama_Llama-2-7b-hf.npy │ │ ├── decode_jsd_meta-llama_Llama-3.1-8B.npy │ │ ├── decode_jsd_meta-llama_Llama-3.2-1B.npy │ │ ├── decode_jsd_meta-llama_Llama-3.2-3B.npy │ │ ├── decode_jsd_microsoft_Phi-3-medium-4k-instruct.npy │ │ ├── decode_jsd_microsoft_Phi-3-mini-4k-instruct.npy │ │ ├── decode_jsd_microsoft_Phi-3-small-8k-instruct.npy │ │ ├── decode_jsd_microsoft_Phi-3.5-mini-instruct.npy │ │ ├── decode_jsd_microsoft_phi-4.npy │ │ ├── decode_jsd_mistralai_Mistral-7B-v0.1.npy │ │ ├── jsddiv_violin_plot.pdf │ │ └── normalized_decodejsd_subplots.pdf │ │ ├── headagreement_js_div │ │ ├── head_agreement_Qwen_Qwen2.5-0.5B.npy │ │ ├── head_agreement_Qwen_Qwen2.5-1.5B.npy │ │ ├── head_agreement_Qwen_Qwen2.5-14B.npy │ │ ├── head_agreement_Qwen_Qwen2.5-3B.npy │ │ ├── head_agreement_Qwen_Qwen2.5-7B.npy │ │ ├── head_agreement_meta-llama_Llama-2-13b-hf.npy │ │ ├── head_agreement_meta-llama_Llama-2-7b-hf.npy │ │ ├── head_agreement_meta-llama_Llama-3.1-8B.npy │ │ ├── head_agreement_meta-llama_Llama-3.2-1B.npy │ │ ├── head_agreement_meta-llama_Llama-3.2-3B.npy │ │ ├── head_agreement_microsoft_Phi-3-medium-4k-instruct.npy │ │ ├── head_agreement_microsoft_Phi-3-mini-4k-instruct.npy │ │ ├── head_agreement_microsoft_Phi-3-small-8k-instruct.npy │ │ ├── head_agreement_microsoft_Phi-3.5-mini-instruct.npy │ │ ├── head_agreement_microsoft_phi-4.npy │ │ └── head_agreement_mistralai_Mistral-7B-v0.1.npy │ │ ├── percdrift │ │ ├── decode_percdrift_Qwen_Qwen2.5-0.5B.npy │ │ ├── decode_percdrift_Qwen_Qwen2.5-14B.npy │ │ ├── decode_percdrift_Qwen_Qwen2.5-3B.npy │ │ ├── decode_percdrift_Qwen_Qwen2.5-7B.npy │ │ ├── decode_percdrift_meta-llama_Llama-2-13b-hf.npy │ │ ├── decode_percdrift_meta-llama_Llama-2-7b-hf.npy │ │ ├── decode_percdrift_meta-llama_Llama-3.1-8B.npy │ │ ├── decode_percdrift_meta-llama_Llama-3.2-1B.npy │ │ ├── decode_percdrift_meta-llama_Llama-3.2-3B.npy │ │ ├── decode_percdrift_microsoft_Phi-3-medium-4k-instruct.npy │ │ ├── decode_percdrift_microsoft_Phi-3-mini-4k-instruct.npy │ │ ├── decode_percdrift_microsoft_Phi-3-small-8k-instruct.npy │ │ ├── decode_percdrift_microsoft_Phi-3.5-mini-instruct.npy │ │ ├── decode_percdrift_microsoft_phi-4.npy │ │ ├── decode_percdrift_mistralai_Mistral-7B-v0.1.npy │ │ └── percdrift_violin_plot.pdf │ │ ├── rankagreement_allheads │ │ ├── head_agreement_violin_plot_all.pdf │ │ ├── head_agreement_violin_plot_mean.pdf │ │ ├── rank_agreement_Qwen_Qwen2.5-0.5B.npy │ │ ├── rank_agreement_Qwen_Qwen2.5-14B.npy │ │ ├── rank_agreement_Qwen_Qwen2.5-3B.npy │ │ ├── rank_agreement_Qwen_Qwen2.5-7B.npy │ │ ├── rank_agreement_meta-llama_Llama-2-13b-hf.npy │ │ ├── rank_agreement_meta-llama_Llama-2-7b-hf.npy │ │ ├── rank_agreement_meta-llama_Llama-3.1-8B.npy │ │ ├── rank_agreement_meta-llama_Llama-3.2-1B.npy │ │ ├── rank_agreement_meta-llama_Llama-3.2-3B.npy │ │ ├── rank_agreement_microsoft_Phi-3-medium-4k-instruct.npy │ │ ├── rank_agreement_microsoft_Phi-3-mini-4k-instruct.npy │ │ ├── rank_agreement_microsoft_Phi-3.5-mini-instruct.npy │ │ └── rank_agreement_mistralai_Mistral-7B-v0.1.npy │ │ └── tok_js_div │ │ ├── layer_consistency_Qwen_Qwen2.5-0.5B.npy │ │ ├── layer_consistency_Qwen_Qwen2.5-1.5B.npy │ │ ├── layer_consistency_Qwen_Qwen2.5-14B.npy │ │ ├── layer_consistency_Qwen_Qwen2.5-3B.npy │ │ ├── layer_consistency_Qwen_Qwen2.5-7B.npy │ │ ├── layer_consistency_meta-llama_Llama-2-13b-hf.npy │ │ ├── layer_consistency_meta-llama_Llama-2-7b-hf.npy │ │ ├── layer_consistency_meta-llama_Llama-3.1-8B.npy │ │ ├── layer_consistency_meta-llama_Llama-3.2-1B.npy │ │ ├── layer_consistency_meta-llama_Llama-3.2-3B.npy │ │ ├── layer_consistency_microsoft_Phi-3-medium-4k-instruct.npy │ │ ├── layer_consistency_microsoft_Phi-3-mini-4k-instruct.npy │ │ ├── layer_consistency_microsoft_Phi-3-small-8k-instruct.npy │ │ ├── layer_consistency_microsoft_Phi-3.5-mini-instruct.npy │ │ ├── layer_consistency_microsoft_phi-4.npy │ │ ├── layer_consistency_mistralai_Mistral-7B-v0.1.npy │ │ ├── mean_js_divergence_per_layer.pdf │ │ ├── normalized_mean_js_divergence_per_layer.pdf │ │ └── normalized_mean_js_divergence_subplots.pdf ├── ablations.py ├── attn_weights_1.png ├── combined_results.csv ├── csvresults │ ├── L2_7B_2k.csv │ ├── L3_1B_2k.csv │ ├── L3_1B_2k_1PC.csv │ ├── L3_1B_2k_1PC_RAND.csv │ ├── L3_3B_2k.csv │ ├── L3_3B_2k_1PC.csv │ ├── L3_8B_1k.csv │ ├── M7B_1k.csv │ ├── P35mini_1k_1PC.csv │ ├── P3mini_1k_1PC.csv │ └── Q25_3B_2k_1PC.csv ├── drift_to_predacc.pdf ├── evalresults │ ├── L2_7B_2k.csv │ ├── L2_7B_2k_ABL_init.csv │ ├── L2_7B_2k_ABL_lookahead.csv │ ├── L2_7B_2k_ABL_rand.csv │ ├── L2_7B_2k_h2o_true.csv │ ├── L2_7B_2k_oracle.csv │ ├── L2_7B_2k_quest.csv │ ├── L2_7B_2k_quest_P4.csv │ ├── L2_7B_2k_snapkv.csv │ ├── L2_7B_2k_streamingLLM.csv │ ├── L3_1B_2k.csv │ ├── L3_1B_2k_1PC.csv │ ├── L3_1B_2k_1PC_h2o_true.csv │ ├── L3_1B_2k_1PC_oracle.csv │ ├── L3_1B_2k_1PC_quest.csv │ ├── L3_1B_2k_1PC_snapkv.csv │ ├── L3_1B_2k_1PC_streamingLLM.csv │ ├── L3_1B_2k_h2o_true.csv │ ├── L3_1B_2k_oracle.csv │ ├── L3_1B_2k_streamingLLM.csv │ ├── L3_3B_2k_1PC.csv │ ├── L3_3B_2k_1PC_h2o_true.csv │ ├── L3_3B_2k_1PC_oracle.csv │ ├── L3_3B_2k_1PC_quest.csv │ ├── L3_3B_2k_1PC_snapkv.csv │ ├── L3_3B_2k_1PC_streamingLLM.csv │ ├── L3_3B_2k_h2o_true.csv │ ├── L3_3B_2k_streamingLLM.csv │ ├── L3_8B_1k.csv │ ├── L3_8B_1k_h2o_true.csv │ ├── L3_8B_1k_oracle.csv │ ├── L3_8B_1k_quest.csv │ ├── L3_8B_1k_quest_P4.csv │ ├── L3_8B_1k_snapkv.csv │ ├── L3_8B_1k_streamingLLM.csv │ ├── LongChat_snapkv.csv │ ├── M7B_1k.csv │ ├── M7B_1k_h2o_true.csv │ ├── M7B_1k_oracle.csv │ ├── M7B_1k_quest.csv │ ├── M7B_1k_snapkv.csv │ ├── M7B_1k_streamingLLM.csv │ ├── P35mini_1k_1PC.csv │ ├── P35mini_1k_1PC_h2o_true.csv │ ├── P35mini_1k_1PC_oracle.csv │ ├── P35mini_1k_1PC_quest.csv │ ├── P35mini_1k_1PC_snapkv.csv │ ├── P35mini_1k_1PC_streamingLLM.csv │ ├── P3mini_1k_1PC.csv │ ├── P3mini_1k_1PC_h2o_true.csv │ ├── P3mini_1k_1PC_oracle.csv │ ├── P3mini_1k_1PC_quest.csv │ ├── P3mini_1k_1PC_snapkv.csv │ └── P3mini_1k_1PC_streamingLLM.csv ├── gen_data_stats.py ├── gen_latex_collate.py ├── graph_ablate_oracle.py ├── graph_icml.py ├── graph_methods.py ├── graph_reasoning_result.py ├── latex_traces │ └── generated_latex │ │ ├── latex_0.tex │ │ ├── latex_1.tex │ │ ├── latex_2.tex │ │ ├── latex_3.tex │ │ ├── latex_4.tex │ │ ├── latex_5.tex │ │ ├── latex_6.tex │ │ ├── latex_7.tex │ │ ├── latex_8.tex │ │ └── latex_9.tex ├── mask_ExpPred.png ├── mask_h2o_true.png ├── mask_oracle.png ├── mask_quest.png ├── mrcr_results.csv ├── oracleablate_plots │ ├── average_acc_comparison.pdf │ ├── average_acc_comparison_percdiff.pdf │ ├── perplexity_comparison.pdf │ └── perplexity_comparison_percdiff.pdf ├── paramratios.csv ├── perf_results │ └── attn_only_latency.pdf ├── plots │ ├── average_acc_comparison.pdf │ ├── average_acc_comparison_percdiff.pdf │ ├── perplexity_comparison.pdf │ └── perplexity_comparison_percdiff.pdf ├── pred_overhead.csv ├── pred_overhead_werr.csv ├── predonly_overhead.pdf ├── reasoning_result.csv ├── reasoning_results_plots.pdf ├── result_graphs │ ├── llama1b_1pc_results │ │ ├── arceasy_acc.pdf │ │ ├── average.pdf │ │ ├── average_pct_diff.pdf │ │ ├── hellaswag_acc.pdf │ │ ├── perplexity.pdf │ │ ├── piqa_acc.pdf │ │ └── winogrande_acc.pdf │ ├── llama1b_results │ │ ├── arceasy_acc.pdf │ │ ├── average.pdf │ │ ├── average_pct_diff.pdf │ │ ├── hellaswag_acc.pdf │ │ ├── perplexity.pdf │ │ ├── piqa_acc.pdf │ │ └── winogrande_acc.pdf │ ├── llama3b_1pc_results │ │ ├── arceasy_acc.pdf │ │ ├── average.pdf │ │ ├── average_pct_diff.pdf │ │ ├── hellaswag_acc.pdf │ │ ├── perplexity.pdf │ │ ├── piqa_acc.pdf │ │ └── winogrande_acc.pdf │ ├── llama3b_results │ │ ├── arceasy_acc.pdf │ │ ├── hellaswag_acc.pdf │ │ ├── perplexity.pdf │ │ ├── piqa_acc.pdf │ │ └── winogrande_acc.pdf │ ├── llama7b_results │ │ ├── arceasy_acc.pdf │ │ ├── average.pdf │ │ ├── average_pct_diff.pdf │ │ ├── hellaswag_acc.pdf │ │ ├── perplexity.pdf │ │ ├── piqa_acc.pdf │ │ └── winogrande_acc.pdf │ ├── llama8b_results │ │ ├── arceasy_acc.pdf │ │ ├── average.pdf │ │ ├── average_pct_diff.pdf │ │ ├── hellaswag_acc.pdf │ │ ├── perplexity.pdf │ │ ├── piqa_acc.pdf │ │ └── winogrande_acc.pdf │ ├── mistral7b_results │ │ ├── arceasy_acc.pdf │ │ ├── average.pdf │ │ ├── average_pct_diff.pdf │ │ ├── hellaswag_acc.pdf │ │ ├── perplexity.pdf │ │ ├── piqa_acc.pdf │ │ └── winogrande_acc.pdf │ ├── phi35mini_1pc_results │ │ ├── arceasy_acc.pdf │ │ ├── average.pdf │ │ ├── average_pct_diff.pdf │ │ ├── hellaswag_acc.pdf │ │ ├── perplexity.pdf │ │ ├── piqa_acc.pdf │ │ └── winogrande_acc.pdf │ └── phi3mini_1pc_results │ │ ├── arceasy_acc.pdf │ │ ├── average.pdf │ │ ├── average_pct_diff.pdf │ │ ├── hellaswag_acc.pdf │ │ ├── perplexity.pdf │ │ ├── piqa_acc.pdf │ │ └── winogrande_acc.pdf ├── results │ └── results_perc │ │ ├── arceasy_pct_diff.pdf │ │ ├── hellaswag_pct_diff.pdf │ │ ├── piqa_pct_diff.pdf │ │ └── winogrande_pct_diff.pdf ├── threshold_calib_graph.py ├── tokhitacc.csv ├── tokhitacc.pdf ├── tokhitacc_stacked.pdf └── traj_drift_to_tokhitacc.csv ├── accelerator_configs ├── default_config.yaml └── fsdp_config.yaml ├── base_model_eval.py ├── base_sentences.py ├── config ├── huggyllama │ └── llama-7b.json ├── lmsys │ └── vicuna-7b-v1.5-16k.json ├── merge_config.py ├── meta-llama │ ├── Llama-2-70b-chat-hf.json │ ├── Llama-2-70b-hf.json │ ├── Llama-2-7b-chat-hf.json │ ├── Llama-2-7b-hf.json │ └── Meta-Llama-3.1-8B.json └── mistralai │ ├── Mistral-7B-v0.1.json │ └── Mixtral-8x7B-v0.1.json ├── d_sparsity_env.yml ├── figs ├── datasetfig.png ├── mainfig.png └── tokenbutlerlogo.png ├── longbench_utils ├── __init__.py ├── config │ ├── dataset2maxlen.json │ ├── dataset2prompt.json │ └── model2maxlen.json ├── metrics.py └── scorer.py ├── longeval ├── __init__.py ├── data │ ├── __init__.py │ ├── dataset.py │ ├── metrics.py │ ├── niah │ │ └── viz.py │ ├── ruler │ │ ├── create_dataset.sh │ │ ├── prepare.py │ │ ├── synthetic.yaml │ │ ├── synthetic │ │ │ ├── common_words_extraction.py │ │ │ ├── constants.py │ │ │ ├── freq_words_extraction.py │ │ │ ├── json │ │ │ │ ├── PaulGrahamEssays_URLs.txt │ │ │ │ ├── download_paulgraham_essay.py │ │ │ │ └── download_qa_dataset.sh │ │ │ ├── niah.py │ │ │ ├── niah_multiturn.py │ │ │ ├── qa.py │ │ │ └── variable_tracking.py │ │ └── tokenizer.py │ └── utils.py ├── eval_acc.py ├── eval_tokenbutler.py └── evaluator.py ├── main.py ├── main_scripts.sh ├── modify_models ├── __init__.py ├── modify_llama.py ├── modify_llama_baselines.py ├── modify_llama_performance.py ├── modify_mistral.py ├── modify_mistral_baselines.py ├── modify_phi3.py ├── modify_phi3_baselines.py └── modify_qwen.py ├── mrcr_custom.json ├── predictor.py ├── quickplot.py ├── requirements.txt ├── scripts ├── generate_calibration.sh ├── long_finetune.sh ├── testgen.sh └── train_predictors.sh ├── test_generation.py ├── test_hf.py ├── triton_kernels ├── flash_attn.py └── flash_attn_mse_loss.py └── utils.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/.gitignore -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/README.md -------------------------------------------------------------------------------- /TokenButler_Draft.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/TokenButler_Draft.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_analysis.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_analysis.py -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-0.5B_decode_jsd_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-0.5B_decode_jsd_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-0.5B_decode_percdrift_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-0.5B_decode_percdrift_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-0.5B_drift_density_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-0.5B_drift_density_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-0.5B_drift_trajectory.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-0.5B_drift_trajectory.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-0.5B_head_agreement_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-0.5B_head_agreement_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-0.5B_headtok_consistency_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-0.5B_headtok_consistency_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-0.5B_rank_agreement_violin.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-0.5B_rank_agreement_violin.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-0.5B_rankcorr_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-0.5B_rankcorr_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-1.5B_decode_jsd_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-1.5B_decode_jsd_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-1.5B_decode_percdrift_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-1.5B_decode_percdrift_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-1.5B_drift_density_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-1.5B_drift_density_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-1.5B_drift_trajectory.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-1.5B_drift_trajectory.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-1.5B_head_agreement_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-1.5B_head_agreement_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-1.5B_headtok_consistency_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-1.5B_headtok_consistency_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-1.5B_rank_agreement_violin.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-1.5B_rank_agreement_violin.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-1.5B_rankcorr_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-1.5B_rankcorr_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-14B_decode_jsd_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-14B_decode_jsd_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-14B_decode_percdrift_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-14B_decode_percdrift_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-14B_drift_density_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-14B_drift_density_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-14B_drift_trajectory.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-14B_drift_trajectory.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-14B_head_agreement_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-14B_head_agreement_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-14B_headtok_consistency_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-14B_headtok_consistency_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-14B_rank_agreement_violin.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-14B_rank_agreement_violin.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-3B_decode_jsd_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-3B_decode_jsd_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-3B_decode_percdrift_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-3B_decode_percdrift_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-3B_drift_density_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-3B_drift_density_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-3B_drift_trajectory.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-3B_drift_trajectory.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-3B_head_agreement_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-3B_head_agreement_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-3B_headtok_consistency_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-3B_headtok_consistency_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-3B_rank_agreement_violin.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-3B_rank_agreement_violin.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-3B_rankcorr_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-3B_rankcorr_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-7B_decode_jsd_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-7B_decode_jsd_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-7B_decode_percdrift_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-7B_decode_percdrift_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-7B_drift_density_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-7B_drift_density_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-7B_drift_trajectory.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-7B_drift_trajectory.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-7B_head_agreement_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-7B_head_agreement_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-7B_headtok_consistency_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-7B_headtok_consistency_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-7B_rank_agreement_violin.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-7B_rank_agreement_violin.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/Qwen_Qwen2.5-7B_rankcorr_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/Qwen_Qwen2.5-7B_rankcorr_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-2-13b-hf_decode_jsd_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-2-13b-hf_decode_jsd_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-2-13b-hf_decode_percdrift_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-2-13b-hf_decode_percdrift_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-2-13b-hf_drift_density_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-2-13b-hf_drift_density_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-2-13b-hf_drift_trajectory.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-2-13b-hf_drift_trajectory.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-2-13b-hf_head_agreement_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-2-13b-hf_head_agreement_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-2-13b-hf_headtok_consistency_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-2-13b-hf_headtok_consistency_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-2-13b-hf_rank_agreement_violin.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-2-13b-hf_rank_agreement_violin.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-2-7b-hf_decode_jsd_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-2-7b-hf_decode_jsd_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-2-7b-hf_decode_percdrift_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-2-7b-hf_decode_percdrift_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-2-7b-hf_drift_density_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-2-7b-hf_drift_density_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-2-7b-hf_drift_trajectory.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-2-7b-hf_drift_trajectory.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-2-7b-hf_head_agreement_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-2-7b-hf_head_agreement_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-2-7b-hf_headtok_consistency_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-2-7b-hf_headtok_consistency_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-2-7b-hf_rank_agreement_violin.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-2-7b-hf_rank_agreement_violin.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.1-8B_decode_jsd_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.1-8B_decode_jsd_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.1-8B_decode_percdrift_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.1-8B_decode_percdrift_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.1-8B_drift_density_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.1-8B_drift_density_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.1-8B_drift_trajectory.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.1-8B_drift_trajectory.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.1-8B_head_agreement_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.1-8B_head_agreement_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.1-8B_headtok_consistency_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.1-8B_headtok_consistency_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.1-8B_rank_agreement_violin.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.1-8B_rank_agreement_violin.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.2-1B_decode_jsd_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.2-1B_decode_jsd_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.2-1B_decode_percdrift_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.2-1B_decode_percdrift_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.2-1B_drift_density_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.2-1B_drift_density_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.2-1B_drift_trajectory.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.2-1B_drift_trajectory.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.2-1B_head_agreement_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.2-1B_head_agreement_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.2-1B_headtok_consistency_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.2-1B_headtok_consistency_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.2-1B_rank_agreement_violin.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.2-1B_rank_agreement_violin.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.2-1B_rankcorr_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.2-1B_rankcorr_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.2-3B_decode_jsd_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.2-3B_decode_jsd_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.2-3B_decode_percdrift_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.2-3B_decode_percdrift_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.2-3B_drift_density_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.2-3B_drift_density_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.2-3B_drift_trajectory.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.2-3B_drift_trajectory.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.2-3B_head_agreement_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.2-3B_head_agreement_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.2-3B_headtok_consistency_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.2-3B_headtok_consistency_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.2-3B_rank_agreement_violin.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.2-3B_rank_agreement_violin.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/meta-llama_Llama-3.2-3B_rankcorr_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/meta-llama_Llama-3.2-3B_rankcorr_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3-medium-4k-instruct_decode_jsd_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3-medium-4k-instruct_decode_jsd_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3-medium-4k-instruct_decode_percdrift_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3-medium-4k-instruct_decode_percdrift_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3-medium-4k-instruct_drift_density_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3-medium-4k-instruct_drift_density_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3-medium-4k-instruct_drift_trajectory.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3-medium-4k-instruct_drift_trajectory.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3-medium-4k-instruct_head_agreement_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3-medium-4k-instruct_head_agreement_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3-medium-4k-instruct_headtok_consistency_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3-medium-4k-instruct_headtok_consistency_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3-medium-4k-instruct_rank_agreement_violin.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3-medium-4k-instruct_rank_agreement_violin.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3-mini-4k-instruct_decode_jsd_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3-mini-4k-instruct_decode_jsd_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3-mini-4k-instruct_decode_percdrift_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3-mini-4k-instruct_decode_percdrift_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3-mini-4k-instruct_drift_density_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3-mini-4k-instruct_drift_density_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3-mini-4k-instruct_drift_trajectory.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3-mini-4k-instruct_drift_trajectory.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3-mini-4k-instruct_head_agreement_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3-mini-4k-instruct_head_agreement_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3-mini-4k-instruct_headtok_consistency_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3-mini-4k-instruct_headtok_consistency_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3-mini-4k-instruct_rank_agreement_violin.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3-mini-4k-instruct_rank_agreement_violin.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3.5-mini-instruct_decode_jsd_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3.5-mini-instruct_decode_jsd_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3.5-mini-instruct_decode_percdrift_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3.5-mini-instruct_decode_percdrift_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3.5-mini-instruct_drift_density_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3.5-mini-instruct_drift_density_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3.5-mini-instruct_drift_trajectory.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3.5-mini-instruct_drift_trajectory.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3.5-mini-instruct_head_agreement_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3.5-mini-instruct_head_agreement_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3.5-mini-instruct_headtok_consistency_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3.5-mini-instruct_headtok_consistency_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_Phi-3.5-mini-instruct_rank_agreement_violin.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_Phi-3.5-mini-instruct_rank_agreement_violin.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_phi-4_decode_jsd_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_phi-4_decode_jsd_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_phi-4_decode_percdrift_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_phi-4_decode_percdrift_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_phi-4_head_agreement_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_phi-4_head_agreement_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/microsoft_phi-4_headtok_consistency_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/microsoft_phi-4_headtok_consistency_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/mistralai_Mistral-7B-v0.1_decode_jsd_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/mistralai_Mistral-7B-v0.1_decode_jsd_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/mistralai_Mistral-7B-v0.1_decode_percdrift_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/mistralai_Mistral-7B-v0.1_decode_percdrift_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/mistralai_Mistral-7B-v0.1_drift_density_heatmap.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/mistralai_Mistral-7B-v0.1_drift_density_heatmap.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/mistralai_Mistral-7B-v0.1_drift_trajectory.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/mistralai_Mistral-7B-v0.1_drift_trajectory.png -------------------------------------------------------------------------------- /ablation_results/ablation_plots/mistralai_Mistral-7B-v0.1_head_agreement_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/mistralai_Mistral-7B-v0.1_head_agreement_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/mistralai_Mistral-7B-v0.1_headtok_consistency_js_divergence.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/mistralai_Mistral-7B-v0.1_headtok_consistency_js_divergence.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/mistralai_Mistral-7B-v0.1_rank_agreement_violin.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/mistralai_Mistral-7B-v0.1_rank_agreement_violin.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_drift_trajectory/combined_drift_plots.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_drift_trajectory/combined_drift_plots.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_Qwen_Qwen2.5-0.5B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_Qwen_Qwen2.5-0.5B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_Qwen_Qwen2.5-14B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_Qwen_Qwen2.5-14B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_Qwen_Qwen2.5-3B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_Qwen_Qwen2.5-3B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_Qwen_Qwen2.5-7B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_Qwen_Qwen2.5-7B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_meta-llama_Llama-2-13b-hf.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_meta-llama_Llama-2-13b-hf.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_meta-llama_Llama-2-7b-hf.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_meta-llama_Llama-2-7b-hf.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_meta-llama_Llama-3.1-8B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_meta-llama_Llama-3.1-8B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_meta-llama_Llama-3.2-1B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_meta-llama_Llama-3.2-1B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_meta-llama_Llama-3.2-3B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_meta-llama_Llama-3.2-3B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_microsoft_Phi-3-medium-4k-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_microsoft_Phi-3-medium-4k-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_microsoft_Phi-3-mini-4k-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_microsoft_Phi-3-mini-4k-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_microsoft_Phi-3.5-mini-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_microsoft_Phi-3.5-mini-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_mistralai_Mistral-7B-v0.1.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_traj_mistralai_Mistral-7B-v0.1.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_trajectories_subplots.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_drift_trajectory/drift_trajectories_subplots.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_Qwen_Qwen2.5-0.5B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_Qwen_Qwen2.5-0.5B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_Qwen_Qwen2.5-1.5B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_Qwen_Qwen2.5-1.5B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_Qwen_Qwen2.5-14B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_Qwen_Qwen2.5-14B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_Qwen_Qwen2.5-3B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_Qwen_Qwen2.5-3B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_Qwen_Qwen2.5-7B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_Qwen_Qwen2.5-7B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_meta-llama_Llama-2-13b-hf.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_meta-llama_Llama-2-13b-hf.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_meta-llama_Llama-2-7b-hf.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_meta-llama_Llama-2-7b-hf.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_meta-llama_Llama-3.1-8B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_meta-llama_Llama-3.1-8B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_meta-llama_Llama-3.2-1B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_meta-llama_Llama-3.2-1B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_meta-llama_Llama-3.2-3B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_meta-llama_Llama-3.2-3B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_microsoft_Phi-3-medium-4k-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_microsoft_Phi-3-medium-4k-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_microsoft_Phi-3-mini-4k-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_microsoft_Phi-3-mini-4k-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_microsoft_Phi-3-small-8k-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_microsoft_Phi-3-small-8k-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_microsoft_Phi-3.5-mini-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_microsoft_Phi-3.5-mini-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_microsoft_phi-4.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_microsoft_phi-4.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_mistralai_Mistral-7B-v0.1.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/decode_jsd_mistralai_Mistral-7B-v0.1.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/jsddiv_violin_plot.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/jsddiv_violin_plot.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/decode_jsd/normalized_decodejsd_subplots.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/decode_jsd/normalized_decodejsd_subplots.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_Qwen_Qwen2.5-0.5B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_Qwen_Qwen2.5-0.5B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_Qwen_Qwen2.5-1.5B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_Qwen_Qwen2.5-1.5B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_Qwen_Qwen2.5-14B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_Qwen_Qwen2.5-14B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_Qwen_Qwen2.5-3B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_Qwen_Qwen2.5-3B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_Qwen_Qwen2.5-7B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_Qwen_Qwen2.5-7B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_meta-llama_Llama-2-13b-hf.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_meta-llama_Llama-2-13b-hf.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_meta-llama_Llama-2-7b-hf.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_meta-llama_Llama-2-7b-hf.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_meta-llama_Llama-3.1-8B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_meta-llama_Llama-3.1-8B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_meta-llama_Llama-3.2-1B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_meta-llama_Llama-3.2-1B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_meta-llama_Llama-3.2-3B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_meta-llama_Llama-3.2-3B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_microsoft_Phi-3-medium-4k-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_microsoft_Phi-3-medium-4k-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_microsoft_Phi-3-mini-4k-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_microsoft_Phi-3-mini-4k-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_microsoft_Phi-3-small-8k-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_microsoft_Phi-3-small-8k-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_microsoft_Phi-3.5-mini-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_microsoft_Phi-3.5-mini-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_microsoft_phi-4.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_microsoft_phi-4.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_mistralai_Mistral-7B-v0.1.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/headagreement_js_div/head_agreement_mistralai_Mistral-7B-v0.1.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/percdrift/decode_percdrift_Qwen_Qwen2.5-0.5B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/percdrift/decode_percdrift_Qwen_Qwen2.5-0.5B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/percdrift/decode_percdrift_Qwen_Qwen2.5-14B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/percdrift/decode_percdrift_Qwen_Qwen2.5-14B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/percdrift/decode_percdrift_Qwen_Qwen2.5-3B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/percdrift/decode_percdrift_Qwen_Qwen2.5-3B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/percdrift/decode_percdrift_Qwen_Qwen2.5-7B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/percdrift/decode_percdrift_Qwen_Qwen2.5-7B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/percdrift/decode_percdrift_meta-llama_Llama-2-13b-hf.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/percdrift/decode_percdrift_meta-llama_Llama-2-13b-hf.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/percdrift/decode_percdrift_meta-llama_Llama-2-7b-hf.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/percdrift/decode_percdrift_meta-llama_Llama-2-7b-hf.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/percdrift/decode_percdrift_meta-llama_Llama-3.1-8B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/percdrift/decode_percdrift_meta-llama_Llama-3.1-8B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/percdrift/decode_percdrift_meta-llama_Llama-3.2-1B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/percdrift/decode_percdrift_meta-llama_Llama-3.2-1B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/percdrift/decode_percdrift_meta-llama_Llama-3.2-3B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/percdrift/decode_percdrift_meta-llama_Llama-3.2-3B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/percdrift/decode_percdrift_microsoft_Phi-3-medium-4k-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/percdrift/decode_percdrift_microsoft_Phi-3-medium-4k-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/percdrift/decode_percdrift_microsoft_Phi-3-mini-4k-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/percdrift/decode_percdrift_microsoft_Phi-3-mini-4k-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/percdrift/decode_percdrift_microsoft_Phi-3-small-8k-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/percdrift/decode_percdrift_microsoft_Phi-3-small-8k-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/percdrift/decode_percdrift_microsoft_Phi-3.5-mini-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/percdrift/decode_percdrift_microsoft_Phi-3.5-mini-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/percdrift/decode_percdrift_microsoft_phi-4.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/percdrift/decode_percdrift_microsoft_phi-4.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/percdrift/decode_percdrift_mistralai_Mistral-7B-v0.1.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/percdrift/decode_percdrift_mistralai_Mistral-7B-v0.1.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/percdrift/percdrift_violin_plot.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/percdrift/percdrift_violin_plot.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/rankagreement_allheads/head_agreement_violin_plot_all.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/rankagreement_allheads/head_agreement_violin_plot_all.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/rankagreement_allheads/head_agreement_violin_plot_mean.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/rankagreement_allheads/head_agreement_violin_plot_mean.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_Qwen_Qwen2.5-0.5B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_Qwen_Qwen2.5-0.5B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_Qwen_Qwen2.5-14B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_Qwen_Qwen2.5-14B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_Qwen_Qwen2.5-3B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_Qwen_Qwen2.5-3B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_Qwen_Qwen2.5-7B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_Qwen_Qwen2.5-7B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_meta-llama_Llama-2-13b-hf.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_meta-llama_Llama-2-13b-hf.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_meta-llama_Llama-2-7b-hf.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_meta-llama_Llama-2-7b-hf.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_meta-llama_Llama-3.1-8B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_meta-llama_Llama-3.1-8B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_meta-llama_Llama-3.2-1B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_meta-llama_Llama-3.2-1B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_meta-llama_Llama-3.2-3B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_meta-llama_Llama-3.2-3B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_microsoft_Phi-3-medium-4k-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_microsoft_Phi-3-medium-4k-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_microsoft_Phi-3-mini-4k-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_microsoft_Phi-3-mini-4k-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_microsoft_Phi-3.5-mini-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_microsoft_Phi-3.5-mini-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_mistralai_Mistral-7B-v0.1.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/rankagreement_allheads/rank_agreement_mistralai_Mistral-7B-v0.1.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_Qwen_Qwen2.5-0.5B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_Qwen_Qwen2.5-0.5B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_Qwen_Qwen2.5-1.5B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_Qwen_Qwen2.5-1.5B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_Qwen_Qwen2.5-14B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_Qwen_Qwen2.5-14B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_Qwen_Qwen2.5-3B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_Qwen_Qwen2.5-3B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_Qwen_Qwen2.5-7B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_Qwen_Qwen2.5-7B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_meta-llama_Llama-2-13b-hf.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_meta-llama_Llama-2-13b-hf.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_meta-llama_Llama-2-7b-hf.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_meta-llama_Llama-2-7b-hf.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_meta-llama_Llama-3.1-8B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_meta-llama_Llama-3.1-8B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_meta-llama_Llama-3.2-1B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_meta-llama_Llama-3.2-1B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_meta-llama_Llama-3.2-3B.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_meta-llama_Llama-3.2-3B.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_microsoft_Phi-3-medium-4k-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_microsoft_Phi-3-medium-4k-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_microsoft_Phi-3-mini-4k-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_microsoft_Phi-3-mini-4k-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_microsoft_Phi-3-small-8k-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_microsoft_Phi-3-small-8k-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_microsoft_Phi-3.5-mini-instruct.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_microsoft_Phi-3.5-mini-instruct.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_microsoft_phi-4.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_microsoft_phi-4.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_mistralai_Mistral-7B-v0.1.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/layer_consistency_mistralai_Mistral-7B-v0.1.npy -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/mean_js_divergence_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/mean_js_divergence_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/normalized_mean_js_divergence_per_layer.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/normalized_mean_js_divergence_per_layer.pdf -------------------------------------------------------------------------------- /ablation_results/ablation_plots/traces/tok_js_div/normalized_mean_js_divergence_subplots.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablation_plots/traces/tok_js_div/normalized_mean_js_divergence_subplots.pdf -------------------------------------------------------------------------------- /ablation_results/ablations.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/ablations.py -------------------------------------------------------------------------------- /ablation_results/attn_weights_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/attn_weights_1.png -------------------------------------------------------------------------------- /ablation_results/combined_results.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/combined_results.csv -------------------------------------------------------------------------------- /ablation_results/csvresults/L2_7B_2k.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/csvresults/L2_7B_2k.csv -------------------------------------------------------------------------------- /ablation_results/csvresults/L3_1B_2k.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/csvresults/L3_1B_2k.csv -------------------------------------------------------------------------------- /ablation_results/csvresults/L3_1B_2k_1PC.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/csvresults/L3_1B_2k_1PC.csv -------------------------------------------------------------------------------- /ablation_results/csvresults/L3_1B_2k_1PC_RAND.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/csvresults/L3_1B_2k_1PC_RAND.csv -------------------------------------------------------------------------------- /ablation_results/csvresults/L3_3B_2k.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/csvresults/L3_3B_2k.csv -------------------------------------------------------------------------------- /ablation_results/csvresults/L3_3B_2k_1PC.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/csvresults/L3_3B_2k_1PC.csv -------------------------------------------------------------------------------- /ablation_results/csvresults/L3_8B_1k.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/csvresults/L3_8B_1k.csv -------------------------------------------------------------------------------- /ablation_results/csvresults/M7B_1k.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/csvresults/M7B_1k.csv -------------------------------------------------------------------------------- /ablation_results/csvresults/P35mini_1k_1PC.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/csvresults/P35mini_1k_1PC.csv -------------------------------------------------------------------------------- /ablation_results/csvresults/P3mini_1k_1PC.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/csvresults/P3mini_1k_1PC.csv -------------------------------------------------------------------------------- /ablation_results/csvresults/Q25_3B_2k_1PC.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/csvresults/Q25_3B_2k_1PC.csv -------------------------------------------------------------------------------- /ablation_results/drift_to_predacc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/drift_to_predacc.pdf -------------------------------------------------------------------------------- /ablation_results/evalresults/L2_7B_2k.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L2_7B_2k.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L2_7B_2k_ABL_init.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L2_7B_2k_ABL_init.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L2_7B_2k_ABL_lookahead.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L2_7B_2k_ABL_lookahead.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L2_7B_2k_ABL_rand.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L2_7B_2k_ABL_rand.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L2_7B_2k_h2o_true.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L2_7B_2k_h2o_true.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L2_7B_2k_oracle.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L2_7B_2k_oracle.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L2_7B_2k_quest.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L2_7B_2k_quest.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L2_7B_2k_quest_P4.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L2_7B_2k_quest_P4.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L2_7B_2k_snapkv.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L2_7B_2k_snapkv.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L2_7B_2k_streamingLLM.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L2_7B_2k_streamingLLM.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_1B_2k.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_1B_2k.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_1B_2k_1PC.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_1B_2k_1PC.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_1B_2k_1PC_h2o_true.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_1B_2k_1PC_h2o_true.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_1B_2k_1PC_oracle.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_1B_2k_1PC_oracle.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_1B_2k_1PC_quest.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_1B_2k_1PC_quest.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_1B_2k_1PC_snapkv.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_1B_2k_1PC_snapkv.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_1B_2k_1PC_streamingLLM.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_1B_2k_1PC_streamingLLM.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_1B_2k_h2o_true.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_1B_2k_h2o_true.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_1B_2k_oracle.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_1B_2k_oracle.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_1B_2k_streamingLLM.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_1B_2k_streamingLLM.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_3B_2k_1PC.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_3B_2k_1PC.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_3B_2k_1PC_h2o_true.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_3B_2k_1PC_h2o_true.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_3B_2k_1PC_oracle.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_3B_2k_1PC_oracle.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_3B_2k_1PC_quest.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_3B_2k_1PC_quest.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_3B_2k_1PC_snapkv.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_3B_2k_1PC_snapkv.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_3B_2k_1PC_streamingLLM.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_3B_2k_1PC_streamingLLM.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_3B_2k_h2o_true.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_3B_2k_h2o_true.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_3B_2k_streamingLLM.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_3B_2k_streamingLLM.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_8B_1k.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_8B_1k.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_8B_1k_h2o_true.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_8B_1k_h2o_true.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_8B_1k_oracle.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_8B_1k_oracle.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_8B_1k_quest.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_8B_1k_quest.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_8B_1k_quest_P4.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_8B_1k_quest_P4.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_8B_1k_snapkv.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_8B_1k_snapkv.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/L3_8B_1k_streamingLLM.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/L3_8B_1k_streamingLLM.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/LongChat_snapkv.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/LongChat_snapkv.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/M7B_1k.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/M7B_1k.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/M7B_1k_h2o_true.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/M7B_1k_h2o_true.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/M7B_1k_oracle.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/M7B_1k_oracle.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/M7B_1k_quest.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/M7B_1k_quest.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/M7B_1k_snapkv.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/M7B_1k_snapkv.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/M7B_1k_streamingLLM.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/M7B_1k_streamingLLM.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/P35mini_1k_1PC.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/P35mini_1k_1PC.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/P35mini_1k_1PC_h2o_true.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/P35mini_1k_1PC_h2o_true.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/P35mini_1k_1PC_oracle.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/P35mini_1k_1PC_oracle.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/P35mini_1k_1PC_quest.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/P35mini_1k_1PC_quest.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/P35mini_1k_1PC_snapkv.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/P35mini_1k_1PC_snapkv.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/P35mini_1k_1PC_streamingLLM.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/P35mini_1k_1PC_streamingLLM.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/P3mini_1k_1PC.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/P3mini_1k_1PC.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/P3mini_1k_1PC_h2o_true.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/P3mini_1k_1PC_h2o_true.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/P3mini_1k_1PC_oracle.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/P3mini_1k_1PC_oracle.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/P3mini_1k_1PC_quest.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/P3mini_1k_1PC_quest.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/P3mini_1k_1PC_snapkv.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/P3mini_1k_1PC_snapkv.csv -------------------------------------------------------------------------------- /ablation_results/evalresults/P3mini_1k_1PC_streamingLLM.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/evalresults/P3mini_1k_1PC_streamingLLM.csv -------------------------------------------------------------------------------- /ablation_results/gen_data_stats.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/gen_data_stats.py -------------------------------------------------------------------------------- /ablation_results/gen_latex_collate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/gen_latex_collate.py -------------------------------------------------------------------------------- /ablation_results/graph_ablate_oracle.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/graph_ablate_oracle.py -------------------------------------------------------------------------------- /ablation_results/graph_icml.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/graph_icml.py -------------------------------------------------------------------------------- /ablation_results/graph_methods.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/graph_methods.py -------------------------------------------------------------------------------- /ablation_results/graph_reasoning_result.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/graph_reasoning_result.py -------------------------------------------------------------------------------- /ablation_results/latex_traces/generated_latex/latex_0.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/latex_traces/generated_latex/latex_0.tex -------------------------------------------------------------------------------- /ablation_results/latex_traces/generated_latex/latex_1.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/latex_traces/generated_latex/latex_1.tex -------------------------------------------------------------------------------- /ablation_results/latex_traces/generated_latex/latex_2.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/latex_traces/generated_latex/latex_2.tex -------------------------------------------------------------------------------- /ablation_results/latex_traces/generated_latex/latex_3.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/latex_traces/generated_latex/latex_3.tex -------------------------------------------------------------------------------- /ablation_results/latex_traces/generated_latex/latex_4.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/latex_traces/generated_latex/latex_4.tex -------------------------------------------------------------------------------- /ablation_results/latex_traces/generated_latex/latex_5.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/latex_traces/generated_latex/latex_5.tex -------------------------------------------------------------------------------- /ablation_results/latex_traces/generated_latex/latex_6.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/latex_traces/generated_latex/latex_6.tex -------------------------------------------------------------------------------- /ablation_results/latex_traces/generated_latex/latex_7.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/latex_traces/generated_latex/latex_7.tex -------------------------------------------------------------------------------- /ablation_results/latex_traces/generated_latex/latex_8.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/latex_traces/generated_latex/latex_8.tex -------------------------------------------------------------------------------- /ablation_results/latex_traces/generated_latex/latex_9.tex: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/latex_traces/generated_latex/latex_9.tex -------------------------------------------------------------------------------- /ablation_results/mask_ExpPred.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/mask_ExpPred.png -------------------------------------------------------------------------------- /ablation_results/mask_h2o_true.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/mask_h2o_true.png -------------------------------------------------------------------------------- /ablation_results/mask_oracle.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/mask_oracle.png -------------------------------------------------------------------------------- /ablation_results/mask_quest.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/mask_quest.png -------------------------------------------------------------------------------- /ablation_results/mrcr_results.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/mrcr_results.csv -------------------------------------------------------------------------------- /ablation_results/oracleablate_plots/average_acc_comparison.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/oracleablate_plots/average_acc_comparison.pdf -------------------------------------------------------------------------------- /ablation_results/oracleablate_plots/average_acc_comparison_percdiff.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/oracleablate_plots/average_acc_comparison_percdiff.pdf -------------------------------------------------------------------------------- /ablation_results/oracleablate_plots/perplexity_comparison.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/oracleablate_plots/perplexity_comparison.pdf -------------------------------------------------------------------------------- /ablation_results/oracleablate_plots/perplexity_comparison_percdiff.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/oracleablate_plots/perplexity_comparison_percdiff.pdf -------------------------------------------------------------------------------- /ablation_results/paramratios.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/paramratios.csv -------------------------------------------------------------------------------- /ablation_results/perf_results/attn_only_latency.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/perf_results/attn_only_latency.pdf -------------------------------------------------------------------------------- /ablation_results/plots/average_acc_comparison.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/plots/average_acc_comparison.pdf -------------------------------------------------------------------------------- /ablation_results/plots/average_acc_comparison_percdiff.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/plots/average_acc_comparison_percdiff.pdf -------------------------------------------------------------------------------- /ablation_results/plots/perplexity_comparison.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/plots/perplexity_comparison.pdf -------------------------------------------------------------------------------- /ablation_results/plots/perplexity_comparison_percdiff.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/plots/perplexity_comparison_percdiff.pdf -------------------------------------------------------------------------------- /ablation_results/pred_overhead.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/pred_overhead.csv -------------------------------------------------------------------------------- /ablation_results/pred_overhead_werr.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/pred_overhead_werr.csv -------------------------------------------------------------------------------- /ablation_results/predonly_overhead.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/predonly_overhead.pdf -------------------------------------------------------------------------------- /ablation_results/reasoning_result.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/reasoning_result.csv -------------------------------------------------------------------------------- /ablation_results/reasoning_results_plots.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/reasoning_results_plots.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama1b_1pc_results/arceasy_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama1b_1pc_results/arceasy_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama1b_1pc_results/average.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama1b_1pc_results/average.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama1b_1pc_results/average_pct_diff.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama1b_1pc_results/average_pct_diff.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama1b_1pc_results/hellaswag_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama1b_1pc_results/hellaswag_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama1b_1pc_results/perplexity.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama1b_1pc_results/perplexity.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama1b_1pc_results/piqa_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama1b_1pc_results/piqa_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama1b_1pc_results/winogrande_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama1b_1pc_results/winogrande_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama1b_results/arceasy_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama1b_results/arceasy_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama1b_results/average.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama1b_results/average.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama1b_results/average_pct_diff.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama1b_results/average_pct_diff.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama1b_results/hellaswag_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama1b_results/hellaswag_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama1b_results/perplexity.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama1b_results/perplexity.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama1b_results/piqa_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama1b_results/piqa_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama1b_results/winogrande_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama1b_results/winogrande_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama3b_1pc_results/arceasy_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama3b_1pc_results/arceasy_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama3b_1pc_results/average.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama3b_1pc_results/average.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama3b_1pc_results/average_pct_diff.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama3b_1pc_results/average_pct_diff.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama3b_1pc_results/hellaswag_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama3b_1pc_results/hellaswag_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama3b_1pc_results/perplexity.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama3b_1pc_results/perplexity.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama3b_1pc_results/piqa_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama3b_1pc_results/piqa_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama3b_1pc_results/winogrande_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama3b_1pc_results/winogrande_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama3b_results/arceasy_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama3b_results/arceasy_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama3b_results/hellaswag_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama3b_results/hellaswag_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama3b_results/perplexity.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama3b_results/perplexity.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama3b_results/piqa_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama3b_results/piqa_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama3b_results/winogrande_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama3b_results/winogrande_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama7b_results/arceasy_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama7b_results/arceasy_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama7b_results/average.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama7b_results/average.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama7b_results/average_pct_diff.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama7b_results/average_pct_diff.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama7b_results/hellaswag_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama7b_results/hellaswag_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama7b_results/perplexity.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama7b_results/perplexity.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama7b_results/piqa_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama7b_results/piqa_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama7b_results/winogrande_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama7b_results/winogrande_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama8b_results/arceasy_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama8b_results/arceasy_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama8b_results/average.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama8b_results/average.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama8b_results/average_pct_diff.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama8b_results/average_pct_diff.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama8b_results/hellaswag_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama8b_results/hellaswag_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama8b_results/perplexity.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama8b_results/perplexity.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama8b_results/piqa_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama8b_results/piqa_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/llama8b_results/winogrande_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/llama8b_results/winogrande_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/mistral7b_results/arceasy_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/mistral7b_results/arceasy_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/mistral7b_results/average.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/mistral7b_results/average.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/mistral7b_results/average_pct_diff.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/mistral7b_results/average_pct_diff.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/mistral7b_results/hellaswag_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/mistral7b_results/hellaswag_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/mistral7b_results/perplexity.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/mistral7b_results/perplexity.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/mistral7b_results/piqa_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/mistral7b_results/piqa_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/mistral7b_results/winogrande_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/mistral7b_results/winogrande_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/phi35mini_1pc_results/arceasy_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/phi35mini_1pc_results/arceasy_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/phi35mini_1pc_results/average.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/phi35mini_1pc_results/average.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/phi35mini_1pc_results/average_pct_diff.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/phi35mini_1pc_results/average_pct_diff.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/phi35mini_1pc_results/hellaswag_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/phi35mini_1pc_results/hellaswag_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/phi35mini_1pc_results/perplexity.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/phi35mini_1pc_results/perplexity.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/phi35mini_1pc_results/piqa_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/phi35mini_1pc_results/piqa_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/phi35mini_1pc_results/winogrande_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/phi35mini_1pc_results/winogrande_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/phi3mini_1pc_results/arceasy_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/phi3mini_1pc_results/arceasy_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/phi3mini_1pc_results/average.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/phi3mini_1pc_results/average.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/phi3mini_1pc_results/average_pct_diff.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/phi3mini_1pc_results/average_pct_diff.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/phi3mini_1pc_results/hellaswag_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/phi3mini_1pc_results/hellaswag_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/phi3mini_1pc_results/perplexity.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/phi3mini_1pc_results/perplexity.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/phi3mini_1pc_results/piqa_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/phi3mini_1pc_results/piqa_acc.pdf -------------------------------------------------------------------------------- /ablation_results/result_graphs/phi3mini_1pc_results/winogrande_acc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/result_graphs/phi3mini_1pc_results/winogrande_acc.pdf -------------------------------------------------------------------------------- /ablation_results/results/results_perc/arceasy_pct_diff.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/results/results_perc/arceasy_pct_diff.pdf -------------------------------------------------------------------------------- /ablation_results/results/results_perc/hellaswag_pct_diff.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/results/results_perc/hellaswag_pct_diff.pdf -------------------------------------------------------------------------------- /ablation_results/results/results_perc/piqa_pct_diff.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/results/results_perc/piqa_pct_diff.pdf -------------------------------------------------------------------------------- /ablation_results/results/results_perc/winogrande_pct_diff.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/results/results_perc/winogrande_pct_diff.pdf -------------------------------------------------------------------------------- /ablation_results/threshold_calib_graph.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/threshold_calib_graph.py -------------------------------------------------------------------------------- /ablation_results/tokhitacc.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/tokhitacc.csv -------------------------------------------------------------------------------- /ablation_results/tokhitacc.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/tokhitacc.pdf -------------------------------------------------------------------------------- /ablation_results/tokhitacc_stacked.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/tokhitacc_stacked.pdf -------------------------------------------------------------------------------- /ablation_results/traj_drift_to_tokhitacc.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/ablation_results/traj_drift_to_tokhitacc.csv -------------------------------------------------------------------------------- /accelerator_configs/default_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/accelerator_configs/default_config.yaml -------------------------------------------------------------------------------- /accelerator_configs/fsdp_config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/accelerator_configs/fsdp_config.yaml -------------------------------------------------------------------------------- /base_model_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/base_model_eval.py -------------------------------------------------------------------------------- /base_sentences.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/base_sentences.py -------------------------------------------------------------------------------- /config/huggyllama/llama-7b.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/config/huggyllama/llama-7b.json -------------------------------------------------------------------------------- /config/lmsys/vicuna-7b-v1.5-16k.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/config/lmsys/vicuna-7b-v1.5-16k.json -------------------------------------------------------------------------------- /config/merge_config.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/config/merge_config.py -------------------------------------------------------------------------------- /config/meta-llama/Llama-2-70b-chat-hf.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/config/meta-llama/Llama-2-70b-chat-hf.json -------------------------------------------------------------------------------- /config/meta-llama/Llama-2-70b-hf.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/config/meta-llama/Llama-2-70b-hf.json -------------------------------------------------------------------------------- /config/meta-llama/Llama-2-7b-chat-hf.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/config/meta-llama/Llama-2-7b-chat-hf.json -------------------------------------------------------------------------------- /config/meta-llama/Llama-2-7b-hf.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/config/meta-llama/Llama-2-7b-hf.json -------------------------------------------------------------------------------- /config/meta-llama/Meta-Llama-3.1-8B.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/config/meta-llama/Meta-Llama-3.1-8B.json -------------------------------------------------------------------------------- /config/mistralai/Mistral-7B-v0.1.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/config/mistralai/Mistral-7B-v0.1.json -------------------------------------------------------------------------------- /config/mistralai/Mixtral-8x7B-v0.1.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/config/mistralai/Mixtral-8x7B-v0.1.json -------------------------------------------------------------------------------- /d_sparsity_env.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/d_sparsity_env.yml -------------------------------------------------------------------------------- /figs/datasetfig.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/figs/datasetfig.png -------------------------------------------------------------------------------- /figs/mainfig.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/figs/mainfig.png -------------------------------------------------------------------------------- /figs/tokenbutlerlogo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/figs/tokenbutlerlogo.png -------------------------------------------------------------------------------- /longbench_utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longbench_utils/__init__.py -------------------------------------------------------------------------------- /longbench_utils/config/dataset2maxlen.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longbench_utils/config/dataset2maxlen.json -------------------------------------------------------------------------------- /longbench_utils/config/dataset2prompt.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longbench_utils/config/dataset2prompt.json -------------------------------------------------------------------------------- /longbench_utils/config/model2maxlen.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longbench_utils/config/model2maxlen.json -------------------------------------------------------------------------------- /longbench_utils/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longbench_utils/metrics.py -------------------------------------------------------------------------------- /longbench_utils/scorer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longbench_utils/scorer.py -------------------------------------------------------------------------------- /longeval/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /longeval/data/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /longeval/data/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/dataset.py -------------------------------------------------------------------------------- /longeval/data/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/metrics.py -------------------------------------------------------------------------------- /longeval/data/niah/viz.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/niah/viz.py -------------------------------------------------------------------------------- /longeval/data/ruler/create_dataset.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/ruler/create_dataset.sh -------------------------------------------------------------------------------- /longeval/data/ruler/prepare.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/ruler/prepare.py -------------------------------------------------------------------------------- /longeval/data/ruler/synthetic.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/ruler/synthetic.yaml -------------------------------------------------------------------------------- /longeval/data/ruler/synthetic/common_words_extraction.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/ruler/synthetic/common_words_extraction.py -------------------------------------------------------------------------------- /longeval/data/ruler/synthetic/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/ruler/synthetic/constants.py -------------------------------------------------------------------------------- /longeval/data/ruler/synthetic/freq_words_extraction.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/ruler/synthetic/freq_words_extraction.py -------------------------------------------------------------------------------- /longeval/data/ruler/synthetic/json/PaulGrahamEssays_URLs.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/ruler/synthetic/json/PaulGrahamEssays_URLs.txt -------------------------------------------------------------------------------- /longeval/data/ruler/synthetic/json/download_paulgraham_essay.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/ruler/synthetic/json/download_paulgraham_essay.py -------------------------------------------------------------------------------- /longeval/data/ruler/synthetic/json/download_qa_dataset.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/ruler/synthetic/json/download_qa_dataset.sh -------------------------------------------------------------------------------- /longeval/data/ruler/synthetic/niah.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/ruler/synthetic/niah.py -------------------------------------------------------------------------------- /longeval/data/ruler/synthetic/niah_multiturn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/ruler/synthetic/niah_multiturn.py -------------------------------------------------------------------------------- /longeval/data/ruler/synthetic/qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/ruler/synthetic/qa.py -------------------------------------------------------------------------------- /longeval/data/ruler/synthetic/variable_tracking.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/ruler/synthetic/variable_tracking.py -------------------------------------------------------------------------------- /longeval/data/ruler/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/ruler/tokenizer.py -------------------------------------------------------------------------------- /longeval/data/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/data/utils.py -------------------------------------------------------------------------------- /longeval/eval_acc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/eval_acc.py -------------------------------------------------------------------------------- /longeval/eval_tokenbutler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/eval_tokenbutler.py -------------------------------------------------------------------------------- /longeval/evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/longeval/evaluator.py -------------------------------------------------------------------------------- /main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/main.py -------------------------------------------------------------------------------- /main_scripts.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/main_scripts.sh -------------------------------------------------------------------------------- /modify_models/__init__.py: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /modify_models/modify_llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/modify_models/modify_llama.py -------------------------------------------------------------------------------- /modify_models/modify_llama_baselines.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/modify_models/modify_llama_baselines.py -------------------------------------------------------------------------------- /modify_models/modify_llama_performance.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/modify_models/modify_llama_performance.py -------------------------------------------------------------------------------- /modify_models/modify_mistral.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/modify_models/modify_mistral.py -------------------------------------------------------------------------------- /modify_models/modify_mistral_baselines.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/modify_models/modify_mistral_baselines.py -------------------------------------------------------------------------------- /modify_models/modify_phi3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/modify_models/modify_phi3.py -------------------------------------------------------------------------------- /modify_models/modify_phi3_baselines.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/modify_models/modify_phi3_baselines.py -------------------------------------------------------------------------------- /modify_models/modify_qwen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/modify_models/modify_qwen.py -------------------------------------------------------------------------------- /mrcr_custom.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/mrcr_custom.json -------------------------------------------------------------------------------- /predictor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/predictor.py -------------------------------------------------------------------------------- /quickplot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/quickplot.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/requirements.txt -------------------------------------------------------------------------------- /scripts/generate_calibration.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/scripts/generate_calibration.sh -------------------------------------------------------------------------------- /scripts/long_finetune.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/scripts/long_finetune.sh -------------------------------------------------------------------------------- /scripts/testgen.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/scripts/testgen.sh -------------------------------------------------------------------------------- /scripts/train_predictors.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/scripts/train_predictors.sh -------------------------------------------------------------------------------- /test_generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/test_generation.py -------------------------------------------------------------------------------- /test_hf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/test_hf.py -------------------------------------------------------------------------------- /triton_kernels/flash_attn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/triton_kernels/flash_attn.py -------------------------------------------------------------------------------- /triton_kernels/flash_attn_mse_loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/triton_kernels/flash_attn_mse_loss.py -------------------------------------------------------------------------------- /utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/abdelfattah-lab/TokenButler/HEAD/utils.py --------------------------------------------------------------------------------