├── .gitignore ├── LICENSE.md ├── Readme.md ├── apply_delta.py ├── conf ├── base.yaml ├── llama │ ├── wiki │ │ ├── llama_13b_merit_v1_pv91_v91_v1_0.yaml │ │ ├── llama_30b_qlora_test.yaml │ │ ├── llama_65b_qlora_train_new.yaml │ │ ├── llama_7b_flan_v1_0.yaml │ │ ├── llama_7b_flan_v1_0_reclor_eval_prompt.yaml │ │ ├── llama_7b_flan_v1_1.yaml │ │ ├── llama_7b_flan_v1_1_ds.yaml │ │ ├── llama_7b_flan_v1_1_reclor_eval_prompt.yaml │ │ ├── llama_7b_flan_v1_2_ds.yaml │ │ ├── llama_7b_flan_v1_2_reclor_eval_prompt.yaml │ │ ├── llama_7b_flan_v1_3_ds.yaml │ │ ├── llama_7b_flan_v1_3_reclor_eval_prompt.yaml │ │ ├── llama_7b_flan_v1_4_ds.yaml │ │ ├── llama_7b_flan_v1_4_reclor_eval_prompt.yaml │ │ ├── llama_7b_merit_v1_pv91_v91_flan_v1_0_reclor_eval_prompt_v1_0.yaml │ │ ├── llama_7b_merit_v1_pv91_v91_v2_0.yaml │ │ ├── test.yaml │ │ ├── vicuna_7b_reclor_eval_prompt.yaml │ │ └── vicuna_7b_reclor_eval_prompt_v1_1.yaml │ └── zh │ │ ├── belle_7b_c3_d_eval_prompt_v1_0_test.yaml │ │ ├── belle_7b_c3_m_eval_prompt_v1_0_test.yaml │ │ ├── belle_7b_logiqav2_eval_prompt_v1_0_test.yaml │ │ ├── linly_7b_c3_d_eval_prompt_v1_0_test.yaml │ │ ├── linly_7b_c3_m_eval_prompt_v1_0_test.yaml │ │ ├── linly_7b_logiqav2_eval_prompt_v1_0_test.yaml │ │ ├── llama2_13b_zh_emb_pt_v1_0.yaml │ │ ├── llama2_13b_zh_sft_combine_v1_0_ds.yaml │ │ ├── llama2_13b_zh_v1_0_ds.yaml │ │ ├── llama2_13b_zh_v1_1_ds.yaml │ │ ├── llama2_13b_zh_v2_0_ds.yaml │ │ ├── llama2_13b_zh_v3_0_ds.yaml │ │ ├── llama_13b_zh_instruct_coig_sft_v1_0_ds.yaml │ │ ├── llama_13b_zh_instruct_sft_combine_v1_0_ds.yaml │ │ ├── llama_13b_zh_instruct_sft_combine_v1_1_ds.yaml │ │ ├── llama_13b_zh_instruct_v1_0_ds.yaml │ │ ├── llama_7b_zh_c3_eval_prompt_v1_0_test.yaml │ │ ├── llama_7b_zh_c3_m_eval_prompt_v1_0_test.yaml │ │ ├── llama_7b_zh_instruct_c3_eval_prompt_v1_0_test.yaml │ │ ├── llama_7b_zh_instruct_c3_m_eval_prompt_v1_0_test.yaml │ │ ├── llama_7b_zh_instruct_coig_sft_v1_0_ds.yaml │ │ ├── llama_7b_zh_instruct_v1_0_ds.yaml │ │ ├── llama_7b_zh_logiqav2_eval_prompt_v1_0.yaml │ │ ├── llama_7b_zh_logiqav2_eval_prompt_v1_0_test.yaml │ │ └── llama_open_7b_300bt_zh_v1_0_ds.yaml ├── mpt │ ├── mpt_30b_mp_test.yaml │ ├── mpt_30b_mp_v1_0.yaml │ ├── mpt_30b_mp_v1_1.yaml │ ├── mpt_30b_mp_v2_0_emb_pt.yaml │ ├── mpt_30b_mp_v2_1_emb_pt.yaml │ └── mpt_30b_mp_v2_2_emb_pt.yaml ├── roberta_split_fact_v1_1.yaml ├── template.yaml └── test │ └── llama_30b_merit_v1_pv91_v91_v5_0.yaml ├── convert2ckpt.py ├── convert2hf.py ├── data ├── __init__.py ├── collators │ ├── __init__.py │ ├── flan.py │ ├── misc.py │ ├── wiki_seq2seq_collator.py │ └── zh_instruct.py ├── data_utils.py ├── files │ ├── c4 │ │ └── en │ │ │ ├── p25 │ │ │ ├── partition_100.json │ │ │ ├── partition_1000.json │ │ │ ├── partition_1025.json │ │ │ ├── partition_125.json │ │ │ ├── partition_150.json │ │ │ ├── partition_175.json │ │ │ ├── partition_200.json │ │ │ ├── partition_225.json │ │ │ ├── partition_25.json │ │ │ ├── partition_250.json │ │ │ ├── partition_275.json │ │ │ ├── partition_300.json │ │ │ ├── partition_325.json │ │ │ ├── partition_350.json │ │ │ ├── partition_375.json │ │ │ ├── partition_400.json │ │ │ ├── partition_425.json │ │ │ ├── partition_450.json │ │ │ ├── partition_475.json │ │ │ ├── partition_50.json │ │ │ ├── partition_500.json │ │ │ ├── partition_525.json │ │ │ ├── partition_550.json │ │ │ ├── partition_575.json │ │ │ ├── partition_600.json │ │ │ ├── partition_625.json │ │ │ ├── partition_650.json │ │ │ ├── partition_675.json │ │ │ ├── partition_700.json │ │ │ ├── partition_725.json │ │ │ ├── partition_75.json │ │ │ ├── partition_750.json │ │ │ ├── partition_775.json │ │ │ ├── partition_800.json │ │ │ ├── partition_825.json │ │ │ ├── partition_850.json │ │ │ ├── partition_875.json │ │ │ ├── partition_900.json │ │ │ ├── partition_925.json │ │ │ ├── partition_950.json │ │ │ └── partition_975.json │ │ │ ├── p50 │ │ │ ├── partition_100.json │ │ │ ├── partition_1000.json │ │ │ ├── partition_1050.json │ │ │ ├── partition_150.json │ │ │ ├── partition_200.json │ │ │ ├── partition_250.json │ │ │ ├── partition_300.json │ │ │ ├── partition_350.json │ │ │ ├── partition_400.json │ │ │ ├── partition_450.json │ │ │ ├── partition_50.json │ │ │ ├── partition_500.json │ │ │ ├── partition_550.json │ │ │ ├── partition_600.json │ │ │ ├── partition_650.json │ │ │ ├── partition_700.json │ │ │ ├── partition_750.json │ │ │ ├── partition_800.json │ │ │ ├── partition_850.json │ │ │ ├── partition_900.json │ │ │ └── partition_950.json │ │ │ ├── partition_100.json │ │ │ ├── partition_1000.json │ │ │ ├── partition_1100.json │ │ │ ├── partition_200.json │ │ │ ├── partition_300.json │ │ │ ├── partition_400.json │ │ │ ├── partition_500.json │ │ │ ├── partition_600.json │ │ │ ├── partition_700.json │ │ │ ├── partition_800.json │ │ │ └── partition_900.json │ └── wudao │ │ ├── file_samples_50.json │ │ ├── partition_000.json │ │ ├── partition_100.json │ │ ├── partition_200.json │ │ ├── partition_300.json │ │ └── partition_400.json ├── flan_combine.py ├── flan_sample.py ├── flan_shuffle.py ├── mp_inputs_process.py ├── preprocessor │ ├── __init__.py │ └── mmlu_merge.py ├── readers.py ├── reclor_prompt.py ├── strategy_qa.py └── test.py ├── ds_inference.py ├── general_util ├── __init__.py ├── average_meter.py ├── dist_utils.py ├── evaluator.py ├── fsdp_utils.py ├── lightseq_utils.py ├── logger.py ├── metrics.py ├── mixin.py ├── tensorboard_helper.py ├── tokenization_utils.py ├── torch_fsdp_utils.py └── training_utils.py ├── make_delta.py ├── models ├── __init__.py ├── llama.py ├── llama_ds_mp_wrap.py ├── mpt │ ├── README.md │ ├── adapt_tokenizer.py │ ├── attention.py │ ├── blocks.py │ ├── config.json │ ├── configuration_mpt.py │ ├── custom_embedding.py │ ├── flash_attn_triton.py │ ├── generation_config.json │ ├── hf_prefixlm_converter.py │ ├── meta_init_context.py │ ├── modeling_mpt.py │ ├── norm.py │ ├── param_init_fns.py │ ├── pytorch_model.bin.index.json │ ├── special_tokens_map.json │ ├── tokenizer.json │ └── tokenizer_config.json ├── mpt_ds_mp_wrap.py ├── patching.py ├── patching_utils.py ├── roberta.py └── t5.py ├── modules ├── __init__.py ├── layers.py ├── logits_processor.py └── trie.py ├── mpt_convert2ckpt.py ├── panda_logo.PNG ├── post_processors ├── bleu.py ├── dist_mixin.py ├── erica_post_processor.py ├── reclor.py └── retrieval.py ├── requirements.txt ├── seed_multi_run.sh ├── trainer_base_ds_mp.py ├── trainer_base_ds_mp_aws.py ├── trainer_base_ds_mul.py ├── trainer_base_ds_mul_aws.py ├── trainer_base_ds_mul_tb.py ├── trainer_base_ds_v1.py ├── trainer_base_fsdp_mul.py ├── trainer_base_fsdp_v4.py ├── trainer_torch_fsdp.py ├── trainer_torch_fsdp_wandb.py └── unify_format.ipynb /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/LICENSE.md -------------------------------------------------------------------------------- /Readme.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/Readme.md -------------------------------------------------------------------------------- /apply_delta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/apply_delta.py -------------------------------------------------------------------------------- /conf/base.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/base.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/llama_13b_merit_v1_pv91_v91_v1_0.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/llama_13b_merit_v1_pv91_v91_v1_0.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/llama_30b_qlora_test.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/llama_30b_qlora_test.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/llama_65b_qlora_train_new.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/llama_65b_qlora_train_new.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/llama_7b_flan_v1_0.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/llama_7b_flan_v1_0.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/llama_7b_flan_v1_0_reclor_eval_prompt.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/llama_7b_flan_v1_0_reclor_eval_prompt.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/llama_7b_flan_v1_1.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/llama_7b_flan_v1_1.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/llama_7b_flan_v1_1_ds.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/llama_7b_flan_v1_1_ds.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/llama_7b_flan_v1_1_reclor_eval_prompt.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/llama_7b_flan_v1_1_reclor_eval_prompt.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/llama_7b_flan_v1_2_ds.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/llama_7b_flan_v1_2_ds.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/llama_7b_flan_v1_2_reclor_eval_prompt.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/llama_7b_flan_v1_2_reclor_eval_prompt.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/llama_7b_flan_v1_3_ds.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/llama_7b_flan_v1_3_ds.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/llama_7b_flan_v1_3_reclor_eval_prompt.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/llama_7b_flan_v1_3_reclor_eval_prompt.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/llama_7b_flan_v1_4_ds.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/llama_7b_flan_v1_4_ds.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/llama_7b_flan_v1_4_reclor_eval_prompt.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/llama_7b_flan_v1_4_reclor_eval_prompt.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/llama_7b_merit_v1_pv91_v91_flan_v1_0_reclor_eval_prompt_v1_0.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/llama_7b_merit_v1_pv91_v91_flan_v1_0_reclor_eval_prompt_v1_0.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/llama_7b_merit_v1_pv91_v91_v2_0.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/llama_7b_merit_v1_pv91_v91_v2_0.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/test.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/test.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/vicuna_7b_reclor_eval_prompt.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/vicuna_7b_reclor_eval_prompt.yaml -------------------------------------------------------------------------------- /conf/llama/wiki/vicuna_7b_reclor_eval_prompt_v1_1.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/wiki/vicuna_7b_reclor_eval_prompt_v1_1.yaml -------------------------------------------------------------------------------- /conf/llama/zh/belle_7b_c3_d_eval_prompt_v1_0_test.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/belle_7b_c3_d_eval_prompt_v1_0_test.yaml -------------------------------------------------------------------------------- /conf/llama/zh/belle_7b_c3_m_eval_prompt_v1_0_test.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/belle_7b_c3_m_eval_prompt_v1_0_test.yaml -------------------------------------------------------------------------------- /conf/llama/zh/belle_7b_logiqav2_eval_prompt_v1_0_test.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/belle_7b_logiqav2_eval_prompt_v1_0_test.yaml -------------------------------------------------------------------------------- /conf/llama/zh/linly_7b_c3_d_eval_prompt_v1_0_test.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/linly_7b_c3_d_eval_prompt_v1_0_test.yaml -------------------------------------------------------------------------------- /conf/llama/zh/linly_7b_c3_m_eval_prompt_v1_0_test.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/linly_7b_c3_m_eval_prompt_v1_0_test.yaml -------------------------------------------------------------------------------- /conf/llama/zh/linly_7b_logiqav2_eval_prompt_v1_0_test.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/linly_7b_logiqav2_eval_prompt_v1_0_test.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama2_13b_zh_emb_pt_v1_0.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama2_13b_zh_emb_pt_v1_0.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama2_13b_zh_sft_combine_v1_0_ds.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama2_13b_zh_sft_combine_v1_0_ds.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama2_13b_zh_v1_0_ds.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama2_13b_zh_v1_0_ds.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama2_13b_zh_v1_1_ds.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama2_13b_zh_v1_1_ds.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama2_13b_zh_v2_0_ds.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama2_13b_zh_v2_0_ds.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama2_13b_zh_v3_0_ds.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama2_13b_zh_v3_0_ds.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama_13b_zh_instruct_coig_sft_v1_0_ds.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama_13b_zh_instruct_coig_sft_v1_0_ds.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama_13b_zh_instruct_sft_combine_v1_0_ds.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama_13b_zh_instruct_sft_combine_v1_0_ds.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama_13b_zh_instruct_sft_combine_v1_1_ds.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama_13b_zh_instruct_sft_combine_v1_1_ds.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama_13b_zh_instruct_v1_0_ds.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama_13b_zh_instruct_v1_0_ds.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama_7b_zh_c3_eval_prompt_v1_0_test.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama_7b_zh_c3_eval_prompt_v1_0_test.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama_7b_zh_c3_m_eval_prompt_v1_0_test.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama_7b_zh_c3_m_eval_prompt_v1_0_test.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama_7b_zh_instruct_c3_eval_prompt_v1_0_test.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama_7b_zh_instruct_c3_eval_prompt_v1_0_test.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama_7b_zh_instruct_c3_m_eval_prompt_v1_0_test.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama_7b_zh_instruct_c3_m_eval_prompt_v1_0_test.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama_7b_zh_instruct_coig_sft_v1_0_ds.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama_7b_zh_instruct_coig_sft_v1_0_ds.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama_7b_zh_instruct_v1_0_ds.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama_7b_zh_instruct_v1_0_ds.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama_7b_zh_logiqav2_eval_prompt_v1_0.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama_7b_zh_logiqav2_eval_prompt_v1_0.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama_7b_zh_logiqav2_eval_prompt_v1_0_test.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama_7b_zh_logiqav2_eval_prompt_v1_0_test.yaml -------------------------------------------------------------------------------- /conf/llama/zh/llama_open_7b_300bt_zh_v1_0_ds.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/llama/zh/llama_open_7b_300bt_zh_v1_0_ds.yaml -------------------------------------------------------------------------------- /conf/mpt/mpt_30b_mp_test.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/mpt/mpt_30b_mp_test.yaml -------------------------------------------------------------------------------- /conf/mpt/mpt_30b_mp_v1_0.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/mpt/mpt_30b_mp_v1_0.yaml -------------------------------------------------------------------------------- /conf/mpt/mpt_30b_mp_v1_1.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/mpt/mpt_30b_mp_v1_1.yaml -------------------------------------------------------------------------------- /conf/mpt/mpt_30b_mp_v2_0_emb_pt.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/mpt/mpt_30b_mp_v2_0_emb_pt.yaml -------------------------------------------------------------------------------- /conf/mpt/mpt_30b_mp_v2_1_emb_pt.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/mpt/mpt_30b_mp_v2_1_emb_pt.yaml -------------------------------------------------------------------------------- /conf/mpt/mpt_30b_mp_v2_2_emb_pt.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/mpt/mpt_30b_mp_v2_2_emb_pt.yaml -------------------------------------------------------------------------------- /conf/roberta_split_fact_v1_1.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/roberta_split_fact_v1_1.yaml -------------------------------------------------------------------------------- /conf/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/template.yaml -------------------------------------------------------------------------------- /conf/test/llama_30b_merit_v1_pv91_v91_v5_0.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/conf/test/llama_30b_merit_v1_pv91_v91_v5_0.yaml -------------------------------------------------------------------------------- /convert2ckpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/convert2ckpt.py -------------------------------------------------------------------------------- /convert2hf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/convert2hf.py -------------------------------------------------------------------------------- /data/__init__.py: -------------------------------------------------------------------------------- 1 | """ 2 | Write your own datasets under this directory. 3 | """ -------------------------------------------------------------------------------- /data/collators/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/collators/__init__.py -------------------------------------------------------------------------------- /data/collators/flan.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/collators/flan.py -------------------------------------------------------------------------------- /data/collators/misc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/collators/misc.py -------------------------------------------------------------------------------- /data/collators/wiki_seq2seq_collator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/collators/wiki_seq2seq_collator.py -------------------------------------------------------------------------------- /data/collators/zh_instruct.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/collators/zh_instruct.py -------------------------------------------------------------------------------- /data/data_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/data_utils.py -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_100.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_100.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_1000.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_1000.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_1025.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_1025.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_125.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_125.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_150.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_150.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_175.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_175.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_200.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_200.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_225.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_225.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_25.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_25.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_250.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_250.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_275.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_275.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_300.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_300.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_325.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_325.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_350.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_350.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_375.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_375.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_400.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_400.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_425.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_425.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_450.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_450.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_475.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_475.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_50.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_50.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_500.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_500.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_525.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_525.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_550.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_550.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_575.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_575.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_600.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_600.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_625.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_625.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_650.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_650.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_675.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_675.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_700.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_700.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_725.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_725.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_75.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_75.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_750.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_750.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_775.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_775.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_800.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_800.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_825.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_825.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_850.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_850.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_875.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_875.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_900.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_900.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_925.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_925.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_950.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_950.json -------------------------------------------------------------------------------- /data/files/c4/en/p25/partition_975.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p25/partition_975.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_100.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_100.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_1000.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_1000.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_1050.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_1050.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_150.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_150.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_200.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_200.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_250.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_250.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_300.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_300.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_350.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_350.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_400.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_400.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_450.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_450.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_50.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_50.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_500.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_500.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_550.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_550.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_600.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_600.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_650.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_650.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_700.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_700.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_750.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_750.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_800.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_800.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_850.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_850.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_900.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_900.json -------------------------------------------------------------------------------- /data/files/c4/en/p50/partition_950.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/p50/partition_950.json -------------------------------------------------------------------------------- /data/files/c4/en/partition_100.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/partition_100.json -------------------------------------------------------------------------------- /data/files/c4/en/partition_1000.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/partition_1000.json -------------------------------------------------------------------------------- /data/files/c4/en/partition_1100.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/partition_1100.json -------------------------------------------------------------------------------- /data/files/c4/en/partition_200.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/partition_200.json -------------------------------------------------------------------------------- /data/files/c4/en/partition_300.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/partition_300.json -------------------------------------------------------------------------------- /data/files/c4/en/partition_400.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/partition_400.json -------------------------------------------------------------------------------- /data/files/c4/en/partition_500.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/partition_500.json -------------------------------------------------------------------------------- /data/files/c4/en/partition_600.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/partition_600.json -------------------------------------------------------------------------------- /data/files/c4/en/partition_700.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/partition_700.json -------------------------------------------------------------------------------- /data/files/c4/en/partition_800.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/partition_800.json -------------------------------------------------------------------------------- /data/files/c4/en/partition_900.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/c4/en/partition_900.json -------------------------------------------------------------------------------- /data/files/wudao/file_samples_50.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/wudao/file_samples_50.json -------------------------------------------------------------------------------- /data/files/wudao/partition_000.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/wudao/partition_000.json -------------------------------------------------------------------------------- /data/files/wudao/partition_100.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/wudao/partition_100.json -------------------------------------------------------------------------------- /data/files/wudao/partition_200.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/wudao/partition_200.json -------------------------------------------------------------------------------- /data/files/wudao/partition_300.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/wudao/partition_300.json -------------------------------------------------------------------------------- /data/files/wudao/partition_400.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/files/wudao/partition_400.json -------------------------------------------------------------------------------- /data/flan_combine.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/flan_combine.py -------------------------------------------------------------------------------- /data/flan_sample.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/flan_sample.py -------------------------------------------------------------------------------- /data/flan_shuffle.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/flan_shuffle.py -------------------------------------------------------------------------------- /data/mp_inputs_process.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/mp_inputs_process.py -------------------------------------------------------------------------------- /data/preprocessor/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /data/preprocessor/mmlu_merge.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/preprocessor/mmlu_merge.py -------------------------------------------------------------------------------- /data/readers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/readers.py -------------------------------------------------------------------------------- /data/reclor_prompt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/reclor_prompt.py -------------------------------------------------------------------------------- /data/strategy_qa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/strategy_qa.py -------------------------------------------------------------------------------- /data/test.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/data/test.py -------------------------------------------------------------------------------- /ds_inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/ds_inference.py -------------------------------------------------------------------------------- /general_util/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /general_util/average_meter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/general_util/average_meter.py -------------------------------------------------------------------------------- /general_util/dist_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/general_util/dist_utils.py -------------------------------------------------------------------------------- /general_util/evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/general_util/evaluator.py -------------------------------------------------------------------------------- /general_util/fsdp_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/general_util/fsdp_utils.py -------------------------------------------------------------------------------- /general_util/lightseq_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/general_util/lightseq_utils.py -------------------------------------------------------------------------------- /general_util/logger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/general_util/logger.py -------------------------------------------------------------------------------- /general_util/metrics.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/general_util/metrics.py -------------------------------------------------------------------------------- /general_util/mixin.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/general_util/mixin.py -------------------------------------------------------------------------------- /general_util/tensorboard_helper.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/general_util/tensorboard_helper.py -------------------------------------------------------------------------------- /general_util/tokenization_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/general_util/tokenization_utils.py -------------------------------------------------------------------------------- /general_util/torch_fsdp_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/general_util/torch_fsdp_utils.py -------------------------------------------------------------------------------- /general_util/training_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/general_util/training_utils.py -------------------------------------------------------------------------------- /make_delta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/make_delta.py -------------------------------------------------------------------------------- /models/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /models/llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/llama.py -------------------------------------------------------------------------------- /models/llama_ds_mp_wrap.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/llama_ds_mp_wrap.py -------------------------------------------------------------------------------- /models/mpt/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/README.md -------------------------------------------------------------------------------- /models/mpt/adapt_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/adapt_tokenizer.py -------------------------------------------------------------------------------- /models/mpt/attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/attention.py -------------------------------------------------------------------------------- /models/mpt/blocks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/blocks.py -------------------------------------------------------------------------------- /models/mpt/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/config.json -------------------------------------------------------------------------------- /models/mpt/configuration_mpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/configuration_mpt.py -------------------------------------------------------------------------------- /models/mpt/custom_embedding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/custom_embedding.py -------------------------------------------------------------------------------- /models/mpt/flash_attn_triton.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/flash_attn_triton.py -------------------------------------------------------------------------------- /models/mpt/generation_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/generation_config.json -------------------------------------------------------------------------------- /models/mpt/hf_prefixlm_converter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/hf_prefixlm_converter.py -------------------------------------------------------------------------------- /models/mpt/meta_init_context.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/meta_init_context.py -------------------------------------------------------------------------------- /models/mpt/modeling_mpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/modeling_mpt.py -------------------------------------------------------------------------------- /models/mpt/norm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/norm.py -------------------------------------------------------------------------------- /models/mpt/param_init_fns.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/param_init_fns.py -------------------------------------------------------------------------------- /models/mpt/pytorch_model.bin.index.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/pytorch_model.bin.index.json -------------------------------------------------------------------------------- /models/mpt/special_tokens_map.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/special_tokens_map.json -------------------------------------------------------------------------------- /models/mpt/tokenizer.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/tokenizer.json -------------------------------------------------------------------------------- /models/mpt/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt/tokenizer_config.json -------------------------------------------------------------------------------- /models/mpt_ds_mp_wrap.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/mpt_ds_mp_wrap.py -------------------------------------------------------------------------------- /models/patching.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/patching.py -------------------------------------------------------------------------------- /models/patching_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/patching_utils.py -------------------------------------------------------------------------------- /models/roberta.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/roberta.py -------------------------------------------------------------------------------- /models/t5.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/models/t5.py -------------------------------------------------------------------------------- /modules/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /modules/layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/modules/layers.py -------------------------------------------------------------------------------- /modules/logits_processor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/modules/logits_processor.py -------------------------------------------------------------------------------- /modules/trie.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/modules/trie.py -------------------------------------------------------------------------------- /mpt_convert2ckpt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/mpt_convert2ckpt.py -------------------------------------------------------------------------------- /panda_logo.PNG: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/panda_logo.PNG -------------------------------------------------------------------------------- /post_processors/bleu.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/post_processors/bleu.py -------------------------------------------------------------------------------- /post_processors/dist_mixin.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/post_processors/dist_mixin.py -------------------------------------------------------------------------------- /post_processors/erica_post_processor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/post_processors/erica_post_processor.py -------------------------------------------------------------------------------- /post_processors/reclor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/post_processors/reclor.py -------------------------------------------------------------------------------- /post_processors/retrieval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/post_processors/retrieval.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/requirements.txt -------------------------------------------------------------------------------- /seed_multi_run.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/seed_multi_run.sh -------------------------------------------------------------------------------- /trainer_base_ds_mp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/trainer_base_ds_mp.py -------------------------------------------------------------------------------- /trainer_base_ds_mp_aws.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/trainer_base_ds_mp_aws.py -------------------------------------------------------------------------------- /trainer_base_ds_mul.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/trainer_base_ds_mul.py -------------------------------------------------------------------------------- /trainer_base_ds_mul_aws.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/trainer_base_ds_mul_aws.py -------------------------------------------------------------------------------- /trainer_base_ds_mul_tb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/trainer_base_ds_mul_tb.py -------------------------------------------------------------------------------- /trainer_base_ds_v1.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/trainer_base_ds_v1.py -------------------------------------------------------------------------------- /trainer_base_fsdp_mul.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/trainer_base_fsdp_mul.py -------------------------------------------------------------------------------- /trainer_base_fsdp_v4.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/trainer_base_fsdp_v4.py -------------------------------------------------------------------------------- /trainer_torch_fsdp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/trainer_torch_fsdp.py -------------------------------------------------------------------------------- /trainer_torch_fsdp_wandb.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/trainer_torch_fsdp_wandb.py -------------------------------------------------------------------------------- /unify_format.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/dandelionsllm/pandallm/HEAD/unify_format.ipynb --------------------------------------------------------------------------------