├── .gitignore ├── 0.download_data.sh ├── 1.data_process_test&dev.sh ├── 2.data_process_train.sh ├── 3.single_node_train_gemma.sh ├── 4.eval.sh ├── LICENSE.txt ├── README.md ├── assets ├── apollo_medium_final.png ├── dataset.png ├── final.png └── result.png ├── metadata ├── dev.json ├── dev │ ├── ar.json │ ├── en.json │ ├── es.json │ ├── fr.json │ ├── hi.json │ └── zh.json ├── merge_json_train.py ├── test.json └── test │ ├── ar.json │ ├── en.json │ ├── es.json │ ├── fr.json │ ├── hi.json │ └── zh.json ├── requirements.txt ├── scripts ├── 3.multinode_train_gema7B_rank0.sh ├── 3.multinode_train_gema7B_rank1.sh └── 3.multinode_train_gema7B_rank2.sh ├── src ├── evaluate │ ├── cli_demo.py │ ├── eval_72b_34b.py │ ├── eval_gemma.py │ ├── eval_huatuo2.py │ ├── eval_llama2.py │ ├── eval_llama70b.py │ ├── eval_meditron.py │ ├── eval_meditron70b.py │ ├── eval_mistral.py │ ├── eval_mmedlm2.py │ ├── eval_qwen.py │ ├── eval_yi.py │ ├── eval_zephyr.py │ └── generate_score.py ├── process │ ├── openai_rewrite │ │ ├── OpenAIGPT.py │ │ ├── OpenAIGPT_datagen_multithread.py │ │ ├── gpt_key.txt │ │ ├── guidelines_en │ │ │ ├── 1.2.prepare_data.py │ │ │ ├── 1.prepare_data.py │ │ │ ├── 1.run_prepare_data.sh │ │ │ ├── 2.run_gpt_datagen_multithread.sh │ │ │ ├── 3.extract.py │ │ │ └── data │ │ │ │ └── 1.dev.jsonl │ │ └── patient_en │ │ │ ├── 1.2.prepare_data.py │ │ │ ├── 1.prepare_data.py │ │ │ ├── 1.run_prepare_data.sh │ │ │ ├── 2.run_gpt_datagen_multithread.sh │ │ │ ├── 3.extract.py │ │ │ └── data │ │ │ └── 1.dev.jsonl │ └── prepare │ │ ├── data_process_test_gemma.py │ │ ├── data_process_test_huatuo2.py │ │ ├── data_process_test_llama.py │ │ ├── data_process_test_meditron.py │ │ ├── data_process_test_mistral.py │ │ ├── data_process_test_qwen.py │ │ ├── data_process_test_yi.py │ │ ├── data_process_test_zephyr.py │ │ ├── data_process_train_gemma.py │ │ ├── data_process_train_qwen.py │ │ └── data_process_train_yi.py ├── proxy-tuning │ ├── eval │ │ ├── apollodata │ │ │ └── run_eval.py │ │ └── utils.py │ ├── modeling │ │ └── mexperts.py │ └── scripts │ │ └── eval │ │ └── proxy_tuning.sh └── sft │ ├── train_gemma_resume_val.py │ ├── train_qwen_resume_val.py │ ├── train_yi_resume_val.py │ └── training_config │ ├── zero.yaml │ └── zero_multi.yaml └── utils ├── check.ipynb └── kill.sh /.gitignore: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /0.download_data.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/0.download_data.sh -------------------------------------------------------------------------------- /1.data_process_test&dev.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/1.data_process_test&dev.sh -------------------------------------------------------------------------------- /2.data_process_train.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/2.data_process_train.sh -------------------------------------------------------------------------------- /3.single_node_train_gemma.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/3.single_node_train_gemma.sh -------------------------------------------------------------------------------- /4.eval.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/4.eval.sh -------------------------------------------------------------------------------- /LICENSE.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/LICENSE.txt -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/README.md -------------------------------------------------------------------------------- /assets/apollo_medium_final.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/assets/apollo_medium_final.png -------------------------------------------------------------------------------- /assets/dataset.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/assets/dataset.png -------------------------------------------------------------------------------- /assets/final.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/assets/final.png -------------------------------------------------------------------------------- /assets/result.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/assets/result.png -------------------------------------------------------------------------------- /metadata/dev.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/metadata/dev.json -------------------------------------------------------------------------------- /metadata/dev/ar.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/metadata/dev/ar.json -------------------------------------------------------------------------------- /metadata/dev/en.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/metadata/dev/en.json -------------------------------------------------------------------------------- /metadata/dev/es.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/metadata/dev/es.json -------------------------------------------------------------------------------- /metadata/dev/fr.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/metadata/dev/fr.json -------------------------------------------------------------------------------- /metadata/dev/hi.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/metadata/dev/hi.json -------------------------------------------------------------------------------- /metadata/dev/zh.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/metadata/dev/zh.json -------------------------------------------------------------------------------- /metadata/merge_json_train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/metadata/merge_json_train.py -------------------------------------------------------------------------------- /metadata/test.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/metadata/test.json -------------------------------------------------------------------------------- /metadata/test/ar.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/metadata/test/ar.json -------------------------------------------------------------------------------- /metadata/test/en.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/metadata/test/en.json -------------------------------------------------------------------------------- /metadata/test/es.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/metadata/test/es.json -------------------------------------------------------------------------------- /metadata/test/fr.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/metadata/test/fr.json -------------------------------------------------------------------------------- /metadata/test/hi.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/metadata/test/hi.json -------------------------------------------------------------------------------- /metadata/test/zh.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/metadata/test/zh.json -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- 1 | llama-index-llms-vllm -------------------------------------------------------------------------------- /scripts/3.multinode_train_gema7B_rank0.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/scripts/3.multinode_train_gema7B_rank0.sh -------------------------------------------------------------------------------- /scripts/3.multinode_train_gema7B_rank1.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/scripts/3.multinode_train_gema7B_rank1.sh -------------------------------------------------------------------------------- /scripts/3.multinode_train_gema7B_rank2.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/scripts/3.multinode_train_gema7B_rank2.sh -------------------------------------------------------------------------------- /src/evaluate/cli_demo.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/evaluate/cli_demo.py -------------------------------------------------------------------------------- /src/evaluate/eval_72b_34b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/evaluate/eval_72b_34b.py -------------------------------------------------------------------------------- /src/evaluate/eval_gemma.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/evaluate/eval_gemma.py -------------------------------------------------------------------------------- /src/evaluate/eval_huatuo2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/evaluate/eval_huatuo2.py -------------------------------------------------------------------------------- /src/evaluate/eval_llama2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/evaluate/eval_llama2.py -------------------------------------------------------------------------------- /src/evaluate/eval_llama70b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/evaluate/eval_llama70b.py -------------------------------------------------------------------------------- /src/evaluate/eval_meditron.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/evaluate/eval_meditron.py -------------------------------------------------------------------------------- /src/evaluate/eval_meditron70b.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/evaluate/eval_meditron70b.py -------------------------------------------------------------------------------- /src/evaluate/eval_mistral.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/evaluate/eval_mistral.py -------------------------------------------------------------------------------- /src/evaluate/eval_mmedlm2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/evaluate/eval_mmedlm2.py -------------------------------------------------------------------------------- /src/evaluate/eval_qwen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/evaluate/eval_qwen.py -------------------------------------------------------------------------------- /src/evaluate/eval_yi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/evaluate/eval_yi.py -------------------------------------------------------------------------------- /src/evaluate/eval_zephyr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/evaluate/eval_zephyr.py -------------------------------------------------------------------------------- /src/evaluate/generate_score.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/evaluate/generate_score.py -------------------------------------------------------------------------------- /src/process/openai_rewrite/OpenAIGPT.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/openai_rewrite/OpenAIGPT.py -------------------------------------------------------------------------------- /src/process/openai_rewrite/OpenAIGPT_datagen_multithread.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/openai_rewrite/OpenAIGPT_datagen_multithread.py -------------------------------------------------------------------------------- /src/process/openai_rewrite/gpt_key.txt: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/process/openai_rewrite/guidelines_en/1.2.prepare_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/openai_rewrite/guidelines_en/1.2.prepare_data.py -------------------------------------------------------------------------------- /src/process/openai_rewrite/guidelines_en/1.prepare_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/openai_rewrite/guidelines_en/1.prepare_data.py -------------------------------------------------------------------------------- /src/process/openai_rewrite/guidelines_en/1.run_prepare_data.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/openai_rewrite/guidelines_en/1.run_prepare_data.sh -------------------------------------------------------------------------------- /src/process/openai_rewrite/guidelines_en/2.run_gpt_datagen_multithread.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/openai_rewrite/guidelines_en/2.run_gpt_datagen_multithread.sh -------------------------------------------------------------------------------- /src/process/openai_rewrite/guidelines_en/3.extract.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/openai_rewrite/guidelines_en/3.extract.py -------------------------------------------------------------------------------- /src/process/openai_rewrite/guidelines_en/data/1.dev.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/openai_rewrite/guidelines_en/data/1.dev.jsonl -------------------------------------------------------------------------------- /src/process/openai_rewrite/patient_en/1.2.prepare_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/openai_rewrite/patient_en/1.2.prepare_data.py -------------------------------------------------------------------------------- /src/process/openai_rewrite/patient_en/1.prepare_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/openai_rewrite/patient_en/1.prepare_data.py -------------------------------------------------------------------------------- /src/process/openai_rewrite/patient_en/1.run_prepare_data.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/openai_rewrite/patient_en/1.run_prepare_data.sh -------------------------------------------------------------------------------- /src/process/openai_rewrite/patient_en/2.run_gpt_datagen_multithread.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/openai_rewrite/patient_en/2.run_gpt_datagen_multithread.sh -------------------------------------------------------------------------------- /src/process/openai_rewrite/patient_en/3.extract.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/openai_rewrite/patient_en/3.extract.py -------------------------------------------------------------------------------- /src/process/openai_rewrite/patient_en/data/1.dev.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/openai_rewrite/patient_en/data/1.dev.jsonl -------------------------------------------------------------------------------- /src/process/prepare/data_process_test_gemma.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/prepare/data_process_test_gemma.py -------------------------------------------------------------------------------- /src/process/prepare/data_process_test_huatuo2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/prepare/data_process_test_huatuo2.py -------------------------------------------------------------------------------- /src/process/prepare/data_process_test_llama.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/prepare/data_process_test_llama.py -------------------------------------------------------------------------------- /src/process/prepare/data_process_test_meditron.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/prepare/data_process_test_meditron.py -------------------------------------------------------------------------------- /src/process/prepare/data_process_test_mistral.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/prepare/data_process_test_mistral.py -------------------------------------------------------------------------------- /src/process/prepare/data_process_test_qwen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/prepare/data_process_test_qwen.py -------------------------------------------------------------------------------- /src/process/prepare/data_process_test_yi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/prepare/data_process_test_yi.py -------------------------------------------------------------------------------- /src/process/prepare/data_process_test_zephyr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/prepare/data_process_test_zephyr.py -------------------------------------------------------------------------------- /src/process/prepare/data_process_train_gemma.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/prepare/data_process_train_gemma.py -------------------------------------------------------------------------------- /src/process/prepare/data_process_train_qwen.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/prepare/data_process_train_qwen.py -------------------------------------------------------------------------------- /src/process/prepare/data_process_train_yi.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/process/prepare/data_process_train_yi.py -------------------------------------------------------------------------------- /src/proxy-tuning/eval/apollodata/run_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/proxy-tuning/eval/apollodata/run_eval.py -------------------------------------------------------------------------------- /src/proxy-tuning/eval/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/proxy-tuning/eval/utils.py -------------------------------------------------------------------------------- /src/proxy-tuning/modeling/mexperts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/proxy-tuning/modeling/mexperts.py -------------------------------------------------------------------------------- /src/proxy-tuning/scripts/eval/proxy_tuning.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/proxy-tuning/scripts/eval/proxy_tuning.sh -------------------------------------------------------------------------------- /src/sft/train_gemma_resume_val.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/sft/train_gemma_resume_val.py -------------------------------------------------------------------------------- /src/sft/train_qwen_resume_val.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/sft/train_qwen_resume_val.py -------------------------------------------------------------------------------- /src/sft/train_yi_resume_val.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/sft/train_yi_resume_val.py -------------------------------------------------------------------------------- /src/sft/training_config/zero.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/sft/training_config/zero.yaml -------------------------------------------------------------------------------- /src/sft/training_config/zero_multi.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/src/sft/training_config/zero_multi.yaml -------------------------------------------------------------------------------- /utils/check.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/utils/check.ipynb -------------------------------------------------------------------------------- /utils/kill.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/FreedomIntelligence/Apollo/HEAD/utils/kill.sh --------------------------------------------------------------------------------