├── .gitignore ├── LICENSE ├── README.md ├── args.py ├── check_param_num.py ├── collect_reports.py ├── efficiency_test.py ├── efficiency_test_llama.py ├── environment.yml ├── eval ├── dispatch_openai_requests.py ├── mmlu │ ├── categories.py │ └── run_eval.py ├── truthfulqa │ └── run_eval.py └── utils.py ├── evaluate.py ├── figures └── APT_arch.png ├── loralib ├── __init__.py ├── layers.py └── utils.py ├── merge_llama_model_lora.py ├── merge_model_lora.py ├── models ├── __init__.py ├── l0_module.py ├── model_args.py ├── modeling_bert.py ├── modeling_llama.py ├── modeling_mt5.py ├── modeling_outputs.py ├── modeling_roberta.py └── modeling_t5.py ├── plot.py ├── plot ├── plot_radar.py ├── plot_salience_and_kurtosis.py ├── plot_salience_history.py ├── plot_tradeoff.py ├── plot_tradeoff_scatter.py └── plot_tta.py ├── post_analysis.py ├── post_training_prune.py ├── post_training_seq2seq_prune.py ├── post_training_sft_prune.py ├── post_training_squad_prune.py ├── prune ├── __init__.py ├── fisher.py ├── pruner.py ├── rearrange.py ├── rescale.py ├── scheduler.py ├── scorer.py └── search.py ├── requirements.txt ├── run.sh ├── run_alpaca_eval.py ├── run_eval_llama_mmlu.py ├── run_glue_multigpu.sh ├── run_llama_sft.py ├── run_minus_seq2seq_training.py ├── run_minus_squad_training.py ├── run_minus_training.py ├── run_pruning.py ├── scripts ├── ablation │ ├── roberta_base_mnli_distillation.sh │ ├── roberta_base_mnli_ft_teacher.sh │ ├── roberta_base_mnli_no_expand.sh │ ├── roberta_base_mnli_uniform_expand.sh │ ├── roberta_base_sst2_distillation.sh │ ├── roberta_base_sst2_ft_teacher.sh │ ├── roberta_base_sst2_lora_teacher.sh │ ├── roberta_base_sst2_no_expand.sh │ └── roberta_base_sst2_uniform_expand.sh ├── adaptpruning │ ├── bert_base_cola_momentum.sh │ ├── bert_base_mnli_momentum.sh │ ├── bert_base_mnli_momentum_noffnstart.sh │ ├── bert_base_mrpc_momentum.sh │ ├── bert_base_qnli_momentum.sh │ ├── bert_base_qqp_momentum.sh │ ├── bert_base_rte_momentum.sh │ ├── bert_base_squad_momentum.sh │ ├── bert_base_squad_momentum_noffnstart.sh │ ├── bert_base_sst2_momentum.sh │ ├── bert_base_sst2_momentum_noffnstart.sh │ ├── bert_base_stsb_momentum.sh │ ├── llama_2_13b_alpaca_gpt4.sh │ ├── llama_2_7b_alpaca_gpt4.sh │ ├── mt5_base_wmt_enro_momentum.sh │ ├── mt5_base_wmt_roen_momentum.sh │ ├── roberta_base_cola_momentum.sh │ ├── roberta_base_mnli_momentum.sh │ ├── roberta_base_mrpc_momentum.sh │ ├── roberta_base_qnli_momentum.sh │ ├── roberta_base_qqp_momentum.sh │ ├── roberta_base_rte_momentum.sh │ ├── roberta_base_squad_momentum.sh │ ├── roberta_base_squadv2_momentum.sh │ ├── roberta_base_sst2_momentum.sh │ ├── roberta_base_sst2_momentum_noffnstart.sh │ ├── roberta_base_stsb_momentum.sh │ ├── t5_base_lm_adapt_cnndm_momentum.sh │ ├── t5_base_lm_adapt_mnli_momentum.sh │ ├── t5_base_lm_adapt_sst2_momentum.sh │ ├── t5_base_xsum_momentum.sh │ ├── t5_xl_lm_adapt_sst2_momentum.sh │ ├── t5_xl_lm_adapt_sst2_momentum_larger.sh │ └── t5_xl_lm_adapt_sst2_momentum_noffnstart.sh ├── adaptpruning_nodistill │ ├── bert_base_mnli.sh │ ├── bert_base_squad.sh │ ├── bert_base_sst2.sh │ ├── llama_13b_alpaca_cleaned_preprune.sh │ ├── llama_2_13b_alpaca_gpt4.sh │ ├── llama_2_13b_alpaca_gpt4_noexpand.sh │ ├── llama_2_13b_alpaca_gpt4_preprune.sh │ ├── llama_2_13b_alpaca_gpt4_preprune_noexpand.sh │ ├── llama_2_7b_alpaca_gpt4.sh │ ├── llama_2_7b_alpaca_gpt4_noexpand.sh │ ├── llama_2_7b_alpaca_gpt4_preprune.sh │ ├── llama_2_7b_alpaca_gpt4_preprune_noexpand.sh │ ├── llama_7b_alpaca_cleaned_preprune.sh │ ├── llama_7b_alpaca_gpt4_preprune.sh │ ├── roberta_base_mnli.sh │ ├── roberta_base_squad.sh │ ├── roberta_base_sst2.sh │ ├── t5_base_lm_adapt_mnli.sh │ ├── t5_base_lm_adapt_sst2.sh │ └── t5_xl_lm_adapt_sst2.sh ├── efficiency_testing.sh ├── efficiency_testing_llama.sh ├── eval.sh ├── eval │ ├── alpaca_eval.sh │ ├── cnndm.sh │ ├── mmlu.sh │ ├── query_alpaca_eval.sh │ ├── truthfulqa.sh │ ├── wmt_enro.sh │ └── xsum.sh ├── eval_lora_roberta_mnli.sh ├── eval_multiple_lora_roberta_mnli.sh ├── ft │ ├── bert_base_mnli.sh │ ├── bert_base_squad.sh │ ├── bert_base_sst2.sh │ ├── llama_2_7b_alpaca_gpt4.sh │ ├── roberta_base_mnli.sh │ ├── roberta_base_squad.sh │ ├── roberta_base_squadv2.sh │ ├── roberta_base_sst2.sh │ ├── t5_base_lm_adapt_cnndm.sh │ ├── t5_base_lm_adapt_sst2.sh │ ├── t5_base_xsum.sh │ └── t5_xl_lm_adapt_sst2.sh ├── hyperparameter_searching │ ├── test_cutoff_prune_step.sh │ ├── test_distill.sh │ ├── test_distill_fisher.sh │ ├── test_distill_shorter.sh │ ├── test_once_prune_step.sh │ ├── test_once_rescaled.sh │ ├── test_throughout_prune.sh │ └── test_training_hypers.sh ├── lora │ ├── bert_base_mnli.sh │ ├── bert_base_squad.sh │ ├── bert_base_sst2.sh │ ├── llama_13b_alpaca_cleaned.sh │ ├── llama_2_13b_alpaca_gpt4.sh │ ├── llama_2_7b_alpaca_gpt4.sh │ ├── llama_7b_alpaca_cleaned.sh │ ├── mt5_base_wmt_enro.sh │ ├── mt5_base_wmt_roen.sh │ ├── roberta_base_cola.sh │ ├── roberta_base_mnli.sh │ ├── roberta_base_mrpc.sh │ ├── roberta_base_qnli.sh │ ├── roberta_base_qqp.sh │ ├── roberta_base_rte.sh │ ├── roberta_base_squad.sh │ ├── roberta_base_squadv2.sh │ ├── roberta_base_sst2.sh │ ├── roberta_base_stsb.sh │ ├── t5_base_lm_adapt_cnndm.sh │ ├── t5_base_lm_adapt_mnli.sh │ ├── t5_base_lm_adapt_sst2.sh │ ├── t5_base_xsum.sh │ ├── t5_xl_lm_adapt_cnndm.sh │ └── t5_xl_lm_adapt_sst2.sh ├── main_results │ └── bert_glue_big_momentum.sh ├── merge_llama_lora.sh ├── merge_lora.sh ├── post_training_cnndm_prune.sh ├── post_training_prune.sh ├── post_training_sft_prune.sh ├── post_training_squad_prune.sh ├── post_training_wmt_prune.sh ├── prepare_data.sh ├── sbatch_scripts │ ├── elastictuning │ │ ├── bert_base_squad_selfmomentum_noffnstart.sh │ │ ├── roberta_base_mnli_selfmomentum.sh │ │ ├── roberta_base_squadv2_selfmomentum.sh │ │ ├── roberta_base_sst2_selfmomentum_noffnstart.sh │ │ ├── t5_base_lm_adapt_sst2_selfmomentum.sh │ │ └── t5_xl_lm_adapt_sst2_selfmomentum.sh │ ├── ft │ │ ├── bert_base_sst2.sbatch │ │ └── roberta_base_sst2.sbatch │ ├── lora │ │ ├── bert_base_sst2.sbatch │ │ ├── roberta_base_mnli.sbatch │ │ ├── roberta_base_squad.sbatch │ │ └── roberta_base_sst2.sbatch │ ├── submit_job.sbatch │ └── submit_job_a100.sbatch ├── test_fisher_prune.sh ├── test_pruning_efficiency.sh ├── test_random_prune.sh ├── tradeoff │ ├── llama_alpaca_pruning.sh │ ├── mt5_base_lora_tradeoff.sh │ ├── roberta_base_ft_mask_tuning.sh │ ├── roberta_base_mask_tuning.sh │ ├── roberta_base_sst2.sh │ ├── roberta_base_sst2_expand.sh │ ├── roberta_base_sst2_expand_noffn.sh │ ├── roberta_base_sst2_tuning.sh │ └── t5_base_lm_adapt_lora_tradeoff.sh ├── train_ft.sh ├── train_ft_distill.sh ├── train_ft_distill_seq2seq.sh ├── train_ft_seq2seq.sh ├── train_lora.sh ├── train_lora_distill.sh ├── train_lora_distill_seq2seq.sh ├── train_lora_distill_squadv2.sh ├── train_lora_minus.sh ├── train_lora_minus_nodistill.sh ├── train_lora_seq2seq.sh ├── train_lora_sft.sh ├── train_lora_squad.sh ├── train_lora_squadv2.sh └── train_lora_wmt.sh ├── test ├── compare_tuning_freeze_fisher.py ├── test_adapt_pruning.py ├── test_awq.py ├── test_backward_scorer.py ├── test_bert.py ├── test_bert_salience.py ├── test_bert_self_momentum.py ├── test_bert_squad.py ├── test_block_normalize.py ├── test_cofi.py ├── test_conditional_pruning.py ├── test_continuous_pruning.py ├── test_deepcopy.py ├── test_deepspeed_profiler.py ├── test_distill_lora_layer.py ├── test_distill_svd.py ├── test_distill_with_reallocation.py ├── test_dynamic_adapter.py ├── test_fisher_pruning.py ├── test_fisher_scores.py ├── test_further_ft.py ├── test_gpu_base_speed.py ├── test_hidden_mask.py ├── test_hidden_states_grad.py ├── test_joint_salience.py ├── test_layer_conversion.py ├── test_llama.py ├── test_llama_backward_scorer.py ├── test_llama_bf16_distill.py ├── test_llama_efficiency.py ├── test_llama_elastictuning.py ├── test_llama_kurtosis.py ├── test_llama_mask_tuning.py ├── test_llama_pre_tuning_prune.py ├── test_llama_prune_strategies.py ├── test_llama_pruned_mmlu_eval.py ├── test_llama_virtualprune.py ├── test_magnitude_scorer.py ├── test_mask_efficiency.py ├── test_memory_usage.py ├── test_model_architecture.py ├── test_model_efficiency.py ├── test_model_grafting.py ├── test_model_prune_recover.py ├── test_moving_salience.py ├── test_neuron_importance.py ├── test_new_continuous_pruning.py ├── test_normalized_fisher.py ├── test_optimizer_state_passing.py ├── test_param_consistency.py ├── test_param_controller.py ├── test_param_tuning.py ├── test_pre_tuning_prune.py ├── test_pre_tuning_prune_t5_3b.py ├── test_prune_consistency.py ├── test_prune_pruned_model.py ├── test_pruned_model.py ├── test_pruned_teacher_training.py ├── test_pruning_linear.py ├── test_rewarmup_lr_scheduling.py ├── test_salience.py ├── test_self_distillation.py ├── test_sequential_pruning.py ├── test_specialize_layer_tuning.py ├── test_squad.py ├── test_t5.py ├── test_t5_3b.py ├── test_t5_3b_pretuning_prune.py ├── test_t5_backward_scorer.py ├── test_t5_efficiency.py ├── test_t5_glue.py ├── test_t5_hidden_states_grad.py ├── test_t5_hidden_z.py ├── test_t5_lm_adapt.py ├── test_t5_lm_adapt_elastictuning.py ├── test_t5_prune_consistency.py ├── test_t5_running.py ├── test_t5_self_distillation.py ├── test_t5_self_momentum.py ├── test_t5_virtual_prune.py ├── test_t5_virtual_prune_with_backward_scorer.py ├── test_t5_xsum.py ├── test_teacher_accuracy.py ├── test_teacher_updating.py ├── test_tensor_mask_transformation.py ├── test_top_down_pruning.py ├── test_torch_gradient.py ├── test_virtual_pruning_tuning.py └── test_weight_restoration.py ├── time_to_accuracy.py ├── trainer ├── allocation_strategy.py ├── model_arch.py ├── param_control.py ├── trainer_minus.py ├── trainer_qa_minus.py └── trainer_seq2seq_minus.py └── utils ├── __init__.py ├── alpaca_utils.py ├── analysis_utils.py ├── cofi_utils.py ├── fisher_utils ├── arch.py ├── efficiency │ ├── latency.py │ ├── mac.py │ ├── mem.py │ └── param.py ├── linalg.py ├── meter.py ├── schedule.py └── timer.py ├── minus_utils.py ├── plot_utils.py ├── qa_utils.py └── utils.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/README.md -------------------------------------------------------------------------------- /args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/args.py -------------------------------------------------------------------------------- /check_param_num.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/check_param_num.py -------------------------------------------------------------------------------- /collect_reports.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/collect_reports.py -------------------------------------------------------------------------------- /efficiency_test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/efficiency_test.py -------------------------------------------------------------------------------- /efficiency_test_llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/efficiency_test_llama.py -------------------------------------------------------------------------------- /environment.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/environment.yml -------------------------------------------------------------------------------- /eval/dispatch_openai_requests.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/eval/dispatch_openai_requests.py -------------------------------------------------------------------------------- /eval/mmlu/categories.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/eval/mmlu/categories.py -------------------------------------------------------------------------------- /eval/mmlu/run_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/eval/mmlu/run_eval.py -------------------------------------------------------------------------------- /eval/truthfulqa/run_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/eval/truthfulqa/run_eval.py -------------------------------------------------------------------------------- /eval/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/eval/utils.py -------------------------------------------------------------------------------- /evaluate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/evaluate.py -------------------------------------------------------------------------------- /figures/APT_arch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/figures/APT_arch.png -------------------------------------------------------------------------------- /loralib/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/loralib/__init__.py -------------------------------------------------------------------------------- /loralib/layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/loralib/layers.py -------------------------------------------------------------------------------- /loralib/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/loralib/utils.py -------------------------------------------------------------------------------- /merge_llama_model_lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/merge_llama_model_lora.py -------------------------------------------------------------------------------- /merge_model_lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/merge_model_lora.py -------------------------------------------------------------------------------- /models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/models/__init__.py -------------------------------------------------------------------------------- /models/l0_module.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/models/l0_module.py -------------------------------------------------------------------------------- /models/model_args.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/models/model_args.py -------------------------------------------------------------------------------- /models/modeling_bert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/models/modeling_bert.py -------------------------------------------------------------------------------- /models/modeling_llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/models/modeling_llama.py -------------------------------------------------------------------------------- /models/modeling_mt5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/models/modeling_mt5.py -------------------------------------------------------------------------------- /models/modeling_outputs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/models/modeling_outputs.py -------------------------------------------------------------------------------- /models/modeling_roberta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/models/modeling_roberta.py -------------------------------------------------------------------------------- /models/modeling_t5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/models/modeling_t5.py -------------------------------------------------------------------------------- /plot.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/plot.py -------------------------------------------------------------------------------- /plot/plot_radar.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/plot/plot_radar.py -------------------------------------------------------------------------------- /plot/plot_salience_and_kurtosis.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/plot/plot_salience_and_kurtosis.py -------------------------------------------------------------------------------- /plot/plot_salience_history.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/plot/plot_salience_history.py -------------------------------------------------------------------------------- /plot/plot_tradeoff.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/plot/plot_tradeoff.py -------------------------------------------------------------------------------- /plot/plot_tradeoff_scatter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/plot/plot_tradeoff_scatter.py -------------------------------------------------------------------------------- /plot/plot_tta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/plot/plot_tta.py -------------------------------------------------------------------------------- /post_analysis.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/post_analysis.py -------------------------------------------------------------------------------- /post_training_prune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/post_training_prune.py -------------------------------------------------------------------------------- /post_training_seq2seq_prune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/post_training_seq2seq_prune.py -------------------------------------------------------------------------------- /post_training_sft_prune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/post_training_sft_prune.py -------------------------------------------------------------------------------- /post_training_squad_prune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/post_training_squad_prune.py -------------------------------------------------------------------------------- /prune/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/prune/__init__.py -------------------------------------------------------------------------------- /prune/fisher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/prune/fisher.py -------------------------------------------------------------------------------- /prune/pruner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/prune/pruner.py -------------------------------------------------------------------------------- /prune/rearrange.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/prune/rearrange.py -------------------------------------------------------------------------------- /prune/rescale.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/prune/rescale.py -------------------------------------------------------------------------------- /prune/scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/prune/scheduler.py -------------------------------------------------------------------------------- /prune/scorer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/prune/scorer.py -------------------------------------------------------------------------------- /prune/search.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/prune/search.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/requirements.txt -------------------------------------------------------------------------------- /run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/run.sh -------------------------------------------------------------------------------- /run_alpaca_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/run_alpaca_eval.py -------------------------------------------------------------------------------- /run_eval_llama_mmlu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/run_eval_llama_mmlu.py -------------------------------------------------------------------------------- /run_glue_multigpu.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/run_glue_multigpu.sh -------------------------------------------------------------------------------- /run_llama_sft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/run_llama_sft.py -------------------------------------------------------------------------------- /run_minus_seq2seq_training.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/run_minus_seq2seq_training.py -------------------------------------------------------------------------------- /run_minus_squad_training.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/run_minus_squad_training.py -------------------------------------------------------------------------------- /run_minus_training.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/run_minus_training.py -------------------------------------------------------------------------------- /run_pruning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/run_pruning.py -------------------------------------------------------------------------------- /scripts/ablation/roberta_base_mnli_distillation.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ablation/roberta_base_mnli_distillation.sh -------------------------------------------------------------------------------- /scripts/ablation/roberta_base_mnli_ft_teacher.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ablation/roberta_base_mnli_ft_teacher.sh -------------------------------------------------------------------------------- /scripts/ablation/roberta_base_mnli_no_expand.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ablation/roberta_base_mnli_no_expand.sh -------------------------------------------------------------------------------- /scripts/ablation/roberta_base_mnli_uniform_expand.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ablation/roberta_base_mnli_uniform_expand.sh -------------------------------------------------------------------------------- /scripts/ablation/roberta_base_sst2_distillation.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ablation/roberta_base_sst2_distillation.sh -------------------------------------------------------------------------------- /scripts/ablation/roberta_base_sst2_ft_teacher.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ablation/roberta_base_sst2_ft_teacher.sh -------------------------------------------------------------------------------- /scripts/ablation/roberta_base_sst2_lora_teacher.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ablation/roberta_base_sst2_lora_teacher.sh -------------------------------------------------------------------------------- /scripts/ablation/roberta_base_sst2_no_expand.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ablation/roberta_base_sst2_no_expand.sh -------------------------------------------------------------------------------- /scripts/ablation/roberta_base_sst2_uniform_expand.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ablation/roberta_base_sst2_uniform_expand.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/bert_base_cola_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/bert_base_cola_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/bert_base_mnli_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/bert_base_mnli_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/bert_base_mnli_momentum_noffnstart.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/bert_base_mnli_momentum_noffnstart.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/bert_base_mrpc_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/bert_base_mrpc_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/bert_base_qnli_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/bert_base_qnli_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/bert_base_qqp_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/bert_base_qqp_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/bert_base_rte_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/bert_base_rte_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/bert_base_squad_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/bert_base_squad_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/bert_base_squad_momentum_noffnstart.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/bert_base_squad_momentum_noffnstart.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/bert_base_sst2_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/bert_base_sst2_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/bert_base_sst2_momentum_noffnstart.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/bert_base_sst2_momentum_noffnstart.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/bert_base_stsb_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/bert_base_stsb_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/llama_2_13b_alpaca_gpt4.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/llama_2_13b_alpaca_gpt4.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/llama_2_7b_alpaca_gpt4.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/llama_2_7b_alpaca_gpt4.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/mt5_base_wmt_enro_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/mt5_base_wmt_enro_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/mt5_base_wmt_roen_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/mt5_base_wmt_roen_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/roberta_base_cola_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/roberta_base_cola_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/roberta_base_mnli_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/roberta_base_mnli_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/roberta_base_mrpc_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/roberta_base_mrpc_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/roberta_base_qnli_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/roberta_base_qnli_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/roberta_base_qqp_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/roberta_base_qqp_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/roberta_base_rte_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/roberta_base_rte_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/roberta_base_squad_momentum.sh: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/adaptpruning/roberta_base_squadv2_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/roberta_base_squadv2_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/roberta_base_sst2_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/roberta_base_sst2_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/roberta_base_sst2_momentum_noffnstart.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/roberta_base_sst2_momentum_noffnstart.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/roberta_base_stsb_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/roberta_base_stsb_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/t5_base_lm_adapt_cnndm_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/t5_base_lm_adapt_cnndm_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/t5_base_lm_adapt_mnli_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/t5_base_lm_adapt_mnli_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/t5_base_lm_adapt_sst2_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/t5_base_lm_adapt_sst2_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/t5_base_xsum_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/t5_base_xsum_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/t5_xl_lm_adapt_sst2_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/t5_xl_lm_adapt_sst2_momentum.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/t5_xl_lm_adapt_sst2_momentum_larger.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/t5_xl_lm_adapt_sst2_momentum_larger.sh -------------------------------------------------------------------------------- /scripts/adaptpruning/t5_xl_lm_adapt_sst2_momentum_noffnstart.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning/t5_xl_lm_adapt_sst2_momentum_noffnstart.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/bert_base_mnli.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/bert_base_mnli.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/bert_base_squad.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/bert_base_squad.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/bert_base_sst2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/bert_base_sst2.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/llama_13b_alpaca_cleaned_preprune.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/llama_13b_alpaca_cleaned_preprune.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/llama_2_13b_alpaca_gpt4.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/llama_2_13b_alpaca_gpt4.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/llama_2_13b_alpaca_gpt4_noexpand.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/llama_2_13b_alpaca_gpt4_noexpand.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/llama_2_13b_alpaca_gpt4_preprune.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/llama_2_13b_alpaca_gpt4_preprune.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/llama_2_13b_alpaca_gpt4_preprune_noexpand.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/llama_2_13b_alpaca_gpt4_preprune_noexpand.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/llama_2_7b_alpaca_gpt4.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/llama_2_7b_alpaca_gpt4.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/llama_2_7b_alpaca_gpt4_noexpand.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/llama_2_7b_alpaca_gpt4_noexpand.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/llama_2_7b_alpaca_gpt4_preprune.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/llama_2_7b_alpaca_gpt4_preprune.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/llama_2_7b_alpaca_gpt4_preprune_noexpand.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/llama_2_7b_alpaca_gpt4_preprune_noexpand.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/llama_7b_alpaca_cleaned_preprune.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/llama_7b_alpaca_cleaned_preprune.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/llama_7b_alpaca_gpt4_preprune.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/llama_7b_alpaca_gpt4_preprune.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/roberta_base_mnli.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/roberta_base_mnli.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/roberta_base_squad.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/roberta_base_squad.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/roberta_base_sst2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/roberta_base_sst2.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/t5_base_lm_adapt_mnli.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/t5_base_lm_adapt_mnli.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/t5_base_lm_adapt_sst2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/t5_base_lm_adapt_sst2.sh -------------------------------------------------------------------------------- /scripts/adaptpruning_nodistill/t5_xl_lm_adapt_sst2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/adaptpruning_nodistill/t5_xl_lm_adapt_sst2.sh -------------------------------------------------------------------------------- /scripts/efficiency_testing.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/efficiency_testing.sh -------------------------------------------------------------------------------- /scripts/efficiency_testing_llama.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/efficiency_testing_llama.sh -------------------------------------------------------------------------------- /scripts/eval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/eval.sh -------------------------------------------------------------------------------- /scripts/eval/alpaca_eval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/eval/alpaca_eval.sh -------------------------------------------------------------------------------- /scripts/eval/cnndm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/eval/cnndm.sh -------------------------------------------------------------------------------- /scripts/eval/mmlu.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/eval/mmlu.sh -------------------------------------------------------------------------------- /scripts/eval/query_alpaca_eval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/eval/query_alpaca_eval.sh -------------------------------------------------------------------------------- /scripts/eval/truthfulqa.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/eval/truthfulqa.sh -------------------------------------------------------------------------------- /scripts/eval/wmt_enro.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/eval/wmt_enro.sh -------------------------------------------------------------------------------- /scripts/eval/xsum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/eval/xsum.sh -------------------------------------------------------------------------------- /scripts/eval_lora_roberta_mnli.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/eval_lora_roberta_mnli.sh -------------------------------------------------------------------------------- /scripts/eval_multiple_lora_roberta_mnli.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/eval_multiple_lora_roberta_mnli.sh -------------------------------------------------------------------------------- /scripts/ft/bert_base_mnli.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ft/bert_base_mnli.sh -------------------------------------------------------------------------------- /scripts/ft/bert_base_squad.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ft/bert_base_squad.sh -------------------------------------------------------------------------------- /scripts/ft/bert_base_sst2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ft/bert_base_sst2.sh -------------------------------------------------------------------------------- /scripts/ft/llama_2_7b_alpaca_gpt4.sh: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /scripts/ft/roberta_base_mnli.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ft/roberta_base_mnli.sh -------------------------------------------------------------------------------- /scripts/ft/roberta_base_squad.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ft/roberta_base_squad.sh -------------------------------------------------------------------------------- /scripts/ft/roberta_base_squadv2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ft/roberta_base_squadv2.sh -------------------------------------------------------------------------------- /scripts/ft/roberta_base_sst2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ft/roberta_base_sst2.sh -------------------------------------------------------------------------------- /scripts/ft/t5_base_lm_adapt_cnndm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ft/t5_base_lm_adapt_cnndm.sh -------------------------------------------------------------------------------- /scripts/ft/t5_base_lm_adapt_sst2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ft/t5_base_lm_adapt_sst2.sh -------------------------------------------------------------------------------- /scripts/ft/t5_base_xsum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ft/t5_base_xsum.sh -------------------------------------------------------------------------------- /scripts/ft/t5_xl_lm_adapt_sst2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/ft/t5_xl_lm_adapt_sst2.sh -------------------------------------------------------------------------------- /scripts/hyperparameter_searching/test_cutoff_prune_step.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/hyperparameter_searching/test_cutoff_prune_step.sh -------------------------------------------------------------------------------- /scripts/hyperparameter_searching/test_distill.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/hyperparameter_searching/test_distill.sh -------------------------------------------------------------------------------- /scripts/hyperparameter_searching/test_distill_fisher.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/hyperparameter_searching/test_distill_fisher.sh -------------------------------------------------------------------------------- /scripts/hyperparameter_searching/test_distill_shorter.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/hyperparameter_searching/test_distill_shorter.sh -------------------------------------------------------------------------------- /scripts/hyperparameter_searching/test_once_prune_step.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/hyperparameter_searching/test_once_prune_step.sh -------------------------------------------------------------------------------- /scripts/hyperparameter_searching/test_once_rescaled.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/hyperparameter_searching/test_once_rescaled.sh -------------------------------------------------------------------------------- /scripts/hyperparameter_searching/test_throughout_prune.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/hyperparameter_searching/test_throughout_prune.sh -------------------------------------------------------------------------------- /scripts/hyperparameter_searching/test_training_hypers.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/hyperparameter_searching/test_training_hypers.sh -------------------------------------------------------------------------------- /scripts/lora/bert_base_mnli.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/bert_base_mnli.sh -------------------------------------------------------------------------------- /scripts/lora/bert_base_squad.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/bert_base_squad.sh -------------------------------------------------------------------------------- /scripts/lora/bert_base_sst2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/bert_base_sst2.sh -------------------------------------------------------------------------------- /scripts/lora/llama_13b_alpaca_cleaned.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/llama_13b_alpaca_cleaned.sh -------------------------------------------------------------------------------- /scripts/lora/llama_2_13b_alpaca_gpt4.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/llama_2_13b_alpaca_gpt4.sh -------------------------------------------------------------------------------- /scripts/lora/llama_2_7b_alpaca_gpt4.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/llama_2_7b_alpaca_gpt4.sh -------------------------------------------------------------------------------- /scripts/lora/llama_7b_alpaca_cleaned.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/llama_7b_alpaca_cleaned.sh -------------------------------------------------------------------------------- /scripts/lora/mt5_base_wmt_enro.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/mt5_base_wmt_enro.sh -------------------------------------------------------------------------------- /scripts/lora/mt5_base_wmt_roen.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/mt5_base_wmt_roen.sh -------------------------------------------------------------------------------- /scripts/lora/roberta_base_cola.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/roberta_base_cola.sh -------------------------------------------------------------------------------- /scripts/lora/roberta_base_mnli.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/roberta_base_mnli.sh -------------------------------------------------------------------------------- /scripts/lora/roberta_base_mrpc.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/roberta_base_mrpc.sh -------------------------------------------------------------------------------- /scripts/lora/roberta_base_qnli.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/roberta_base_qnli.sh -------------------------------------------------------------------------------- /scripts/lora/roberta_base_qqp.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/roberta_base_qqp.sh -------------------------------------------------------------------------------- /scripts/lora/roberta_base_rte.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/roberta_base_rte.sh -------------------------------------------------------------------------------- /scripts/lora/roberta_base_squad.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/roberta_base_squad.sh -------------------------------------------------------------------------------- /scripts/lora/roberta_base_squadv2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/roberta_base_squadv2.sh -------------------------------------------------------------------------------- /scripts/lora/roberta_base_sst2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/roberta_base_sst2.sh -------------------------------------------------------------------------------- /scripts/lora/roberta_base_stsb.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/roberta_base_stsb.sh -------------------------------------------------------------------------------- /scripts/lora/t5_base_lm_adapt_cnndm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/t5_base_lm_adapt_cnndm.sh -------------------------------------------------------------------------------- /scripts/lora/t5_base_lm_adapt_mnli.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/t5_base_lm_adapt_mnli.sh -------------------------------------------------------------------------------- /scripts/lora/t5_base_lm_adapt_sst2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/t5_base_lm_adapt_sst2.sh -------------------------------------------------------------------------------- /scripts/lora/t5_base_xsum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/t5_base_xsum.sh -------------------------------------------------------------------------------- /scripts/lora/t5_xl_lm_adapt_cnndm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/t5_xl_lm_adapt_cnndm.sh -------------------------------------------------------------------------------- /scripts/lora/t5_xl_lm_adapt_sst2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/lora/t5_xl_lm_adapt_sst2.sh -------------------------------------------------------------------------------- /scripts/main_results/bert_glue_big_momentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/main_results/bert_glue_big_momentum.sh -------------------------------------------------------------------------------- /scripts/merge_llama_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/merge_llama_lora.sh -------------------------------------------------------------------------------- /scripts/merge_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/merge_lora.sh -------------------------------------------------------------------------------- /scripts/post_training_cnndm_prune.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/post_training_cnndm_prune.sh -------------------------------------------------------------------------------- /scripts/post_training_prune.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/post_training_prune.sh -------------------------------------------------------------------------------- /scripts/post_training_sft_prune.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/post_training_sft_prune.sh -------------------------------------------------------------------------------- /scripts/post_training_squad_prune.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/post_training_squad_prune.sh -------------------------------------------------------------------------------- /scripts/post_training_wmt_prune.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/post_training_wmt_prune.sh -------------------------------------------------------------------------------- /scripts/prepare_data.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/prepare_data.sh -------------------------------------------------------------------------------- /scripts/sbatch_scripts/elastictuning/bert_base_squad_selfmomentum_noffnstart.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/sbatch_scripts/elastictuning/bert_base_squad_selfmomentum_noffnstart.sh -------------------------------------------------------------------------------- /scripts/sbatch_scripts/elastictuning/roberta_base_mnli_selfmomentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/sbatch_scripts/elastictuning/roberta_base_mnli_selfmomentum.sh -------------------------------------------------------------------------------- /scripts/sbatch_scripts/elastictuning/roberta_base_squadv2_selfmomentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/sbatch_scripts/elastictuning/roberta_base_squadv2_selfmomentum.sh -------------------------------------------------------------------------------- /scripts/sbatch_scripts/elastictuning/roberta_base_sst2_selfmomentum_noffnstart.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/sbatch_scripts/elastictuning/roberta_base_sst2_selfmomentum_noffnstart.sh -------------------------------------------------------------------------------- /scripts/sbatch_scripts/elastictuning/t5_base_lm_adapt_sst2_selfmomentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/sbatch_scripts/elastictuning/t5_base_lm_adapt_sst2_selfmomentum.sh -------------------------------------------------------------------------------- /scripts/sbatch_scripts/elastictuning/t5_xl_lm_adapt_sst2_selfmomentum.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/sbatch_scripts/elastictuning/t5_xl_lm_adapt_sst2_selfmomentum.sh -------------------------------------------------------------------------------- /scripts/sbatch_scripts/ft/bert_base_sst2.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/sbatch_scripts/ft/bert_base_sst2.sbatch -------------------------------------------------------------------------------- /scripts/sbatch_scripts/ft/roberta_base_sst2.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/sbatch_scripts/ft/roberta_base_sst2.sbatch -------------------------------------------------------------------------------- /scripts/sbatch_scripts/lora/bert_base_sst2.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/sbatch_scripts/lora/bert_base_sst2.sbatch -------------------------------------------------------------------------------- /scripts/sbatch_scripts/lora/roberta_base_mnli.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/sbatch_scripts/lora/roberta_base_mnli.sbatch -------------------------------------------------------------------------------- /scripts/sbatch_scripts/lora/roberta_base_squad.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/sbatch_scripts/lora/roberta_base_squad.sbatch -------------------------------------------------------------------------------- /scripts/sbatch_scripts/lora/roberta_base_sst2.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/sbatch_scripts/lora/roberta_base_sst2.sbatch -------------------------------------------------------------------------------- /scripts/sbatch_scripts/submit_job.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/sbatch_scripts/submit_job.sbatch -------------------------------------------------------------------------------- /scripts/sbatch_scripts/submit_job_a100.sbatch: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/sbatch_scripts/submit_job_a100.sbatch -------------------------------------------------------------------------------- /scripts/test_fisher_prune.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/test_fisher_prune.sh -------------------------------------------------------------------------------- /scripts/test_pruning_efficiency.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/test_pruning_efficiency.sh -------------------------------------------------------------------------------- /scripts/test_random_prune.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/test_random_prune.sh -------------------------------------------------------------------------------- /scripts/tradeoff/llama_alpaca_pruning.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/tradeoff/llama_alpaca_pruning.sh -------------------------------------------------------------------------------- /scripts/tradeoff/mt5_base_lora_tradeoff.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/tradeoff/mt5_base_lora_tradeoff.sh -------------------------------------------------------------------------------- /scripts/tradeoff/roberta_base_ft_mask_tuning.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/tradeoff/roberta_base_ft_mask_tuning.sh -------------------------------------------------------------------------------- /scripts/tradeoff/roberta_base_mask_tuning.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/tradeoff/roberta_base_mask_tuning.sh -------------------------------------------------------------------------------- /scripts/tradeoff/roberta_base_sst2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/tradeoff/roberta_base_sst2.sh -------------------------------------------------------------------------------- /scripts/tradeoff/roberta_base_sst2_expand.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/tradeoff/roberta_base_sst2_expand.sh -------------------------------------------------------------------------------- /scripts/tradeoff/roberta_base_sst2_expand_noffn.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/tradeoff/roberta_base_sst2_expand_noffn.sh -------------------------------------------------------------------------------- /scripts/tradeoff/roberta_base_sst2_tuning.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/tradeoff/roberta_base_sst2_tuning.sh -------------------------------------------------------------------------------- /scripts/tradeoff/t5_base_lm_adapt_lora_tradeoff.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/tradeoff/t5_base_lm_adapt_lora_tradeoff.sh -------------------------------------------------------------------------------- /scripts/train_ft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/train_ft.sh -------------------------------------------------------------------------------- /scripts/train_ft_distill.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/train_ft_distill.sh -------------------------------------------------------------------------------- /scripts/train_ft_distill_seq2seq.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/train_ft_distill_seq2seq.sh -------------------------------------------------------------------------------- /scripts/train_ft_seq2seq.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/train_ft_seq2seq.sh -------------------------------------------------------------------------------- /scripts/train_lora.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/train_lora.sh -------------------------------------------------------------------------------- /scripts/train_lora_distill.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/train_lora_distill.sh -------------------------------------------------------------------------------- /scripts/train_lora_distill_seq2seq.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/train_lora_distill_seq2seq.sh -------------------------------------------------------------------------------- /scripts/train_lora_distill_squadv2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/train_lora_distill_squadv2.sh -------------------------------------------------------------------------------- /scripts/train_lora_minus.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/train_lora_minus.sh -------------------------------------------------------------------------------- /scripts/train_lora_minus_nodistill.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/train_lora_minus_nodistill.sh -------------------------------------------------------------------------------- /scripts/train_lora_seq2seq.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/train_lora_seq2seq.sh -------------------------------------------------------------------------------- /scripts/train_lora_sft.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/train_lora_sft.sh -------------------------------------------------------------------------------- /scripts/train_lora_squad.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/train_lora_squad.sh -------------------------------------------------------------------------------- /scripts/train_lora_squadv2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/train_lora_squadv2.sh -------------------------------------------------------------------------------- /scripts/train_lora_wmt.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/scripts/train_lora_wmt.sh -------------------------------------------------------------------------------- /test/compare_tuning_freeze_fisher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/compare_tuning_freeze_fisher.py -------------------------------------------------------------------------------- /test/test_adapt_pruning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_adapt_pruning.py -------------------------------------------------------------------------------- /test/test_awq.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_awq.py -------------------------------------------------------------------------------- /test/test_backward_scorer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_backward_scorer.py -------------------------------------------------------------------------------- /test/test_bert.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_bert.py -------------------------------------------------------------------------------- /test/test_bert_salience.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_bert_salience.py -------------------------------------------------------------------------------- /test/test_bert_self_momentum.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_bert_self_momentum.py -------------------------------------------------------------------------------- /test/test_bert_squad.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_bert_squad.py -------------------------------------------------------------------------------- /test/test_block_normalize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_block_normalize.py -------------------------------------------------------------------------------- /test/test_cofi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_cofi.py -------------------------------------------------------------------------------- /test/test_conditional_pruning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_conditional_pruning.py -------------------------------------------------------------------------------- /test/test_continuous_pruning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_continuous_pruning.py -------------------------------------------------------------------------------- /test/test_deepcopy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_deepcopy.py -------------------------------------------------------------------------------- /test/test_deepspeed_profiler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_deepspeed_profiler.py -------------------------------------------------------------------------------- /test/test_distill_lora_layer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_distill_lora_layer.py -------------------------------------------------------------------------------- /test/test_distill_svd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_distill_svd.py -------------------------------------------------------------------------------- /test/test_distill_with_reallocation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_distill_with_reallocation.py -------------------------------------------------------------------------------- /test/test_dynamic_adapter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_dynamic_adapter.py -------------------------------------------------------------------------------- /test/test_fisher_pruning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_fisher_pruning.py -------------------------------------------------------------------------------- /test/test_fisher_scores.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_fisher_scores.py -------------------------------------------------------------------------------- /test/test_further_ft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_further_ft.py -------------------------------------------------------------------------------- /test/test_gpu_base_speed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_gpu_base_speed.py -------------------------------------------------------------------------------- /test/test_hidden_mask.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_hidden_mask.py -------------------------------------------------------------------------------- /test/test_hidden_states_grad.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_hidden_states_grad.py -------------------------------------------------------------------------------- /test/test_joint_salience.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_joint_salience.py -------------------------------------------------------------------------------- /test/test_layer_conversion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_layer_conversion.py -------------------------------------------------------------------------------- /test/test_llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_llama.py -------------------------------------------------------------------------------- /test/test_llama_backward_scorer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_llama_backward_scorer.py -------------------------------------------------------------------------------- /test/test_llama_bf16_distill.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_llama_bf16_distill.py -------------------------------------------------------------------------------- /test/test_llama_efficiency.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_llama_efficiency.py -------------------------------------------------------------------------------- /test/test_llama_elastictuning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_llama_elastictuning.py -------------------------------------------------------------------------------- /test/test_llama_kurtosis.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_llama_kurtosis.py -------------------------------------------------------------------------------- /test/test_llama_mask_tuning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_llama_mask_tuning.py -------------------------------------------------------------------------------- /test/test_llama_pre_tuning_prune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_llama_pre_tuning_prune.py -------------------------------------------------------------------------------- /test/test_llama_prune_strategies.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_llama_prune_strategies.py -------------------------------------------------------------------------------- /test/test_llama_pruned_mmlu_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_llama_pruned_mmlu_eval.py -------------------------------------------------------------------------------- /test/test_llama_virtualprune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_llama_virtualprune.py -------------------------------------------------------------------------------- /test/test_magnitude_scorer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_magnitude_scorer.py -------------------------------------------------------------------------------- /test/test_mask_efficiency.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_mask_efficiency.py -------------------------------------------------------------------------------- /test/test_memory_usage.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_memory_usage.py -------------------------------------------------------------------------------- /test/test_model_architecture.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_model_architecture.py -------------------------------------------------------------------------------- /test/test_model_efficiency.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_model_efficiency.py -------------------------------------------------------------------------------- /test/test_model_grafting.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_model_grafting.py -------------------------------------------------------------------------------- /test/test_model_prune_recover.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_model_prune_recover.py -------------------------------------------------------------------------------- /test/test_moving_salience.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_moving_salience.py -------------------------------------------------------------------------------- /test/test_neuron_importance.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_neuron_importance.py -------------------------------------------------------------------------------- /test/test_new_continuous_pruning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_new_continuous_pruning.py -------------------------------------------------------------------------------- /test/test_normalized_fisher.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_normalized_fisher.py -------------------------------------------------------------------------------- /test/test_optimizer_state_passing.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /test/test_param_consistency.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_param_consistency.py -------------------------------------------------------------------------------- /test/test_param_controller.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_param_controller.py -------------------------------------------------------------------------------- /test/test_param_tuning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_param_tuning.py -------------------------------------------------------------------------------- /test/test_pre_tuning_prune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_pre_tuning_prune.py -------------------------------------------------------------------------------- /test/test_pre_tuning_prune_t5_3b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_pre_tuning_prune_t5_3b.py -------------------------------------------------------------------------------- /test/test_prune_consistency.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_prune_consistency.py -------------------------------------------------------------------------------- /test/test_prune_pruned_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_prune_pruned_model.py -------------------------------------------------------------------------------- /test/test_pruned_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_pruned_model.py -------------------------------------------------------------------------------- /test/test_pruned_teacher_training.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_pruned_teacher_training.py -------------------------------------------------------------------------------- /test/test_pruning_linear.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_pruning_linear.py -------------------------------------------------------------------------------- /test/test_rewarmup_lr_scheduling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_rewarmup_lr_scheduling.py -------------------------------------------------------------------------------- /test/test_salience.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_salience.py -------------------------------------------------------------------------------- /test/test_self_distillation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_self_distillation.py -------------------------------------------------------------------------------- /test/test_sequential_pruning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_sequential_pruning.py -------------------------------------------------------------------------------- /test/test_specialize_layer_tuning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_specialize_layer_tuning.py -------------------------------------------------------------------------------- /test/test_squad.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_squad.py -------------------------------------------------------------------------------- /test/test_t5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_t5.py -------------------------------------------------------------------------------- /test/test_t5_3b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_t5_3b.py -------------------------------------------------------------------------------- /test/test_t5_3b_pretuning_prune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_t5_3b_pretuning_prune.py -------------------------------------------------------------------------------- /test/test_t5_backward_scorer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_t5_backward_scorer.py -------------------------------------------------------------------------------- /test/test_t5_efficiency.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_t5_efficiency.py -------------------------------------------------------------------------------- /test/test_t5_glue.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_t5_glue.py -------------------------------------------------------------------------------- /test/test_t5_hidden_states_grad.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_t5_hidden_states_grad.py -------------------------------------------------------------------------------- /test/test_t5_hidden_z.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_t5_hidden_z.py -------------------------------------------------------------------------------- /test/test_t5_lm_adapt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_t5_lm_adapt.py -------------------------------------------------------------------------------- /test/test_t5_lm_adapt_elastictuning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_t5_lm_adapt_elastictuning.py -------------------------------------------------------------------------------- /test/test_t5_prune_consistency.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_t5_prune_consistency.py -------------------------------------------------------------------------------- /test/test_t5_running.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_t5_running.py -------------------------------------------------------------------------------- /test/test_t5_self_distillation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_t5_self_distillation.py -------------------------------------------------------------------------------- /test/test_t5_self_momentum.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_t5_self_momentum.py -------------------------------------------------------------------------------- /test/test_t5_virtual_prune.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_t5_virtual_prune.py -------------------------------------------------------------------------------- /test/test_t5_virtual_prune_with_backward_scorer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_t5_virtual_prune_with_backward_scorer.py -------------------------------------------------------------------------------- /test/test_t5_xsum.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_t5_xsum.py -------------------------------------------------------------------------------- /test/test_teacher_accuracy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_teacher_accuracy.py -------------------------------------------------------------------------------- /test/test_teacher_updating.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_teacher_updating.py -------------------------------------------------------------------------------- /test/test_tensor_mask_transformation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_tensor_mask_transformation.py -------------------------------------------------------------------------------- /test/test_top_down_pruning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_top_down_pruning.py -------------------------------------------------------------------------------- /test/test_torch_gradient.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_torch_gradient.py -------------------------------------------------------------------------------- /test/test_virtual_pruning_tuning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_virtual_pruning_tuning.py -------------------------------------------------------------------------------- /test/test_weight_restoration.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/test/test_weight_restoration.py -------------------------------------------------------------------------------- /time_to_accuracy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/time_to_accuracy.py -------------------------------------------------------------------------------- /trainer/allocation_strategy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/trainer/allocation_strategy.py -------------------------------------------------------------------------------- /trainer/model_arch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/trainer/model_arch.py -------------------------------------------------------------------------------- /trainer/param_control.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/trainer/param_control.py -------------------------------------------------------------------------------- /trainer/trainer_minus.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/trainer/trainer_minus.py -------------------------------------------------------------------------------- /trainer/trainer_qa_minus.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/trainer/trainer_qa_minus.py -------------------------------------------------------------------------------- /trainer/trainer_seq2seq_minus.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/trainer/trainer_seq2seq_minus.py -------------------------------------------------------------------------------- /utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/utils/__init__.py -------------------------------------------------------------------------------- /utils/alpaca_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/utils/alpaca_utils.py -------------------------------------------------------------------------------- /utils/analysis_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/utils/analysis_utils.py -------------------------------------------------------------------------------- /utils/cofi_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/utils/cofi_utils.py -------------------------------------------------------------------------------- /utils/fisher_utils/arch.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/utils/fisher_utils/arch.py -------------------------------------------------------------------------------- /utils/fisher_utils/efficiency/latency.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/utils/fisher_utils/efficiency/latency.py -------------------------------------------------------------------------------- /utils/fisher_utils/efficiency/mac.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/utils/fisher_utils/efficiency/mac.py -------------------------------------------------------------------------------- /utils/fisher_utils/efficiency/mem.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/utils/fisher_utils/efficiency/mem.py -------------------------------------------------------------------------------- /utils/fisher_utils/efficiency/param.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/utils/fisher_utils/efficiency/param.py -------------------------------------------------------------------------------- /utils/fisher_utils/linalg.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/utils/fisher_utils/linalg.py -------------------------------------------------------------------------------- /utils/fisher_utils/meter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/utils/fisher_utils/meter.py -------------------------------------------------------------------------------- /utils/fisher_utils/schedule.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/utils/fisher_utils/schedule.py -------------------------------------------------------------------------------- /utils/fisher_utils/timer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/utils/fisher_utils/timer.py -------------------------------------------------------------------------------- /utils/minus_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/utils/minus_utils.py -------------------------------------------------------------------------------- /utils/plot_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/utils/plot_utils.py -------------------------------------------------------------------------------- /utils/qa_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/utils/qa_utils.py -------------------------------------------------------------------------------- /utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ROIM1998/APT/HEAD/utils/utils.py --------------------------------------------------------------------------------