├── .gitignore ├── LICENSE ├── README.md ├── assets └── teaser.png ├── docs ├── ENV.md ├── EXP.md ├── HF.md └── LINK.md ├── exp ├── 250318-eval-baseline_llm │ ├── h100.makefile │ ├── l40s.makefile │ └── qwen_w_wo_cot.makefile ├── 250318-eval-medical_llm │ ├── above_10b.makefile │ ├── below_10b.makefile │ └── template.makefile ├── 250319-ablation │ ├── h100.data_curation.makefile │ ├── h100.extraplate_thinking_budget.makefile │ ├── h100.makefile │ ├── keep_thinking_below_budget.makefile │ ├── l40s.makefile │ └── thinking_budget.makefile ├── eval_commands.sh └── train_commands.sh ├── requirements.m1.txt └── src ├── ablate_data ├── distill_random.sh ├── filtering_r1_wrong.ipynb ├── random_select.ipynb ├── select_hard_sample_by_domain.ipynb └── upload_data.ipynb ├── analyse ├── gather_results.py ├── gather_results.template.ipynb ├── gather_time.py ├── stats_data_source_domain.ipynb ├── stats_token_length.ipynb └── stats_token_length_paper.ipynb ├── collect_data ├── __init__.py ├── decontaminate.py ├── deduplicate.py ├── headqa.py ├── medmcqa.py ├── medqa.py ├── merge_data.py ├── pubmedqa.py └── utils.py ├── collect_eval_data └── collect_eval_data.py ├── distill_data ├── __init__.py ├── decontaminate_eval.py ├── distill_data.py ├── filtering_qwen_correct.ipynb ├── filtering_r1_wrong.ipynb ├── prompt.py └── upload_curator_responses.py ├── eval ├── __init__.py ├── configs │ └── base.yaml ├── extract_format.py ├── inference_keep_think.py ├── kill_sglang_server.sh └── score.py ├── select_data ├── __init__.py ├── build_prompt.py ├── classify_sample.py ├── extract_domain.py ├── mesh_qualifier.json ├── mesh_qualifier_hierarchical.json ├── qualifier_scope_note.tsv ├── raw_mesh_qualifer_list.txt ├── select_hard_sample_by_domain_source.ipynb └── stats_domain.ipynb ├── tokenize_data ├── apply_chat_template.py └── upload_data.ipynb └── train ├── fsdp_config_qwen.json ├── fsdp_config_qwen_cpu.json ├── launch.sh ├── sft.py ├── sft_local.sh └── sft_slurm.sh /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/README.md -------------------------------------------------------------------------------- /assets/teaser.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/assets/teaser.png -------------------------------------------------------------------------------- /docs/ENV.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/docs/ENV.md -------------------------------------------------------------------------------- /docs/EXP.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/docs/EXP.md -------------------------------------------------------------------------------- /docs/HF.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/docs/HF.md -------------------------------------------------------------------------------- /docs/LINK.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/docs/LINK.md -------------------------------------------------------------------------------- /exp/250318-eval-baseline_llm/h100.makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/exp/250318-eval-baseline_llm/h100.makefile -------------------------------------------------------------------------------- /exp/250318-eval-baseline_llm/l40s.makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/exp/250318-eval-baseline_llm/l40s.makefile -------------------------------------------------------------------------------- /exp/250318-eval-baseline_llm/qwen_w_wo_cot.makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/exp/250318-eval-baseline_llm/qwen_w_wo_cot.makefile -------------------------------------------------------------------------------- /exp/250318-eval-medical_llm/above_10b.makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/exp/250318-eval-medical_llm/above_10b.makefile -------------------------------------------------------------------------------- /exp/250318-eval-medical_llm/below_10b.makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/exp/250318-eval-medical_llm/below_10b.makefile -------------------------------------------------------------------------------- /exp/250318-eval-medical_llm/template.makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/exp/250318-eval-medical_llm/template.makefile -------------------------------------------------------------------------------- /exp/250319-ablation/h100.data_curation.makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/exp/250319-ablation/h100.data_curation.makefile -------------------------------------------------------------------------------- /exp/250319-ablation/h100.extraplate_thinking_budget.makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/exp/250319-ablation/h100.extraplate_thinking_budget.makefile -------------------------------------------------------------------------------- /exp/250319-ablation/h100.makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/exp/250319-ablation/h100.makefile -------------------------------------------------------------------------------- /exp/250319-ablation/keep_thinking_below_budget.makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/exp/250319-ablation/keep_thinking_below_budget.makefile -------------------------------------------------------------------------------- /exp/250319-ablation/l40s.makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/exp/250319-ablation/l40s.makefile -------------------------------------------------------------------------------- /exp/250319-ablation/thinking_budget.makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/exp/250319-ablation/thinking_budget.makefile -------------------------------------------------------------------------------- /exp/eval_commands.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/exp/eval_commands.sh -------------------------------------------------------------------------------- /exp/train_commands.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/exp/train_commands.sh -------------------------------------------------------------------------------- /requirements.m1.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/requirements.m1.txt -------------------------------------------------------------------------------- /src/ablate_data/distill_random.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/ablate_data/distill_random.sh -------------------------------------------------------------------------------- /src/ablate_data/filtering_r1_wrong.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/ablate_data/filtering_r1_wrong.ipynb -------------------------------------------------------------------------------- /src/ablate_data/random_select.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/ablate_data/random_select.ipynb -------------------------------------------------------------------------------- /src/ablate_data/select_hard_sample_by_domain.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/ablate_data/select_hard_sample_by_domain.ipynb -------------------------------------------------------------------------------- /src/ablate_data/upload_data.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/ablate_data/upload_data.ipynb -------------------------------------------------------------------------------- /src/analyse/gather_results.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/analyse/gather_results.py -------------------------------------------------------------------------------- /src/analyse/gather_results.template.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/analyse/gather_results.template.ipynb -------------------------------------------------------------------------------- /src/analyse/gather_time.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/analyse/gather_time.py -------------------------------------------------------------------------------- /src/analyse/stats_data_source_domain.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/analyse/stats_data_source_domain.ipynb -------------------------------------------------------------------------------- /src/analyse/stats_token_length.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/analyse/stats_token_length.ipynb -------------------------------------------------------------------------------- /src/analyse/stats_token_length_paper.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/analyse/stats_token_length_paper.ipynb -------------------------------------------------------------------------------- /src/collect_data/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/collect_data/decontaminate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/collect_data/decontaminate.py -------------------------------------------------------------------------------- /src/collect_data/deduplicate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/collect_data/deduplicate.py -------------------------------------------------------------------------------- /src/collect_data/headqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/collect_data/headqa.py -------------------------------------------------------------------------------- /src/collect_data/medmcqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/collect_data/medmcqa.py -------------------------------------------------------------------------------- /src/collect_data/medqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/collect_data/medqa.py -------------------------------------------------------------------------------- /src/collect_data/merge_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/collect_data/merge_data.py -------------------------------------------------------------------------------- /src/collect_data/pubmedqa.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/collect_data/pubmedqa.py -------------------------------------------------------------------------------- /src/collect_data/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/collect_data/utils.py -------------------------------------------------------------------------------- /src/collect_eval_data/collect_eval_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/collect_eval_data/collect_eval_data.py -------------------------------------------------------------------------------- /src/distill_data/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/distill_data/decontaminate_eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/distill_data/decontaminate_eval.py -------------------------------------------------------------------------------- /src/distill_data/distill_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/distill_data/distill_data.py -------------------------------------------------------------------------------- /src/distill_data/filtering_qwen_correct.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/distill_data/filtering_qwen_correct.ipynb -------------------------------------------------------------------------------- /src/distill_data/filtering_r1_wrong.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/distill_data/filtering_r1_wrong.ipynb -------------------------------------------------------------------------------- /src/distill_data/prompt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/distill_data/prompt.py -------------------------------------------------------------------------------- /src/distill_data/upload_curator_responses.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/distill_data/upload_curator_responses.py -------------------------------------------------------------------------------- /src/eval/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/eval/configs/base.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/eval/configs/base.yaml -------------------------------------------------------------------------------- /src/eval/extract_format.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/eval/extract_format.py -------------------------------------------------------------------------------- /src/eval/inference_keep_think.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/eval/inference_keep_think.py -------------------------------------------------------------------------------- /src/eval/kill_sglang_server.sh: -------------------------------------------------------------------------------- 1 | pgrep 'sglang' -f | xargs kill -9 2 | echo "Exit" -------------------------------------------------------------------------------- /src/eval/score.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/eval/score.py -------------------------------------------------------------------------------- /src/select_data/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/select_data/build_prompt.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/select_data/build_prompt.py -------------------------------------------------------------------------------- /src/select_data/classify_sample.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/select_data/classify_sample.py -------------------------------------------------------------------------------- /src/select_data/extract_domain.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/select_data/extract_domain.py -------------------------------------------------------------------------------- /src/select_data/mesh_qualifier.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/select_data/mesh_qualifier.json -------------------------------------------------------------------------------- /src/select_data/mesh_qualifier_hierarchical.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/select_data/mesh_qualifier_hierarchical.json -------------------------------------------------------------------------------- /src/select_data/qualifier_scope_note.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/select_data/qualifier_scope_note.tsv -------------------------------------------------------------------------------- /src/select_data/raw_mesh_qualifer_list.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/select_data/raw_mesh_qualifer_list.txt -------------------------------------------------------------------------------- /src/select_data/select_hard_sample_by_domain_source.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/select_data/select_hard_sample_by_domain_source.ipynb -------------------------------------------------------------------------------- /src/select_data/stats_domain.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/select_data/stats_domain.ipynb -------------------------------------------------------------------------------- /src/tokenize_data/apply_chat_template.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/tokenize_data/apply_chat_template.py -------------------------------------------------------------------------------- /src/tokenize_data/upload_data.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/tokenize_data/upload_data.ipynb -------------------------------------------------------------------------------- /src/train/fsdp_config_qwen.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/train/fsdp_config_qwen.json -------------------------------------------------------------------------------- /src/train/fsdp_config_qwen_cpu.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/train/fsdp_config_qwen_cpu.json -------------------------------------------------------------------------------- /src/train/launch.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/train/launch.sh -------------------------------------------------------------------------------- /src/train/sft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/train/sft.py -------------------------------------------------------------------------------- /src/train/sft_local.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/train/sft_local.sh -------------------------------------------------------------------------------- /src/train/sft_slurm.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/UCSC-VLAA/m1/HEAD/src/train/sft_slurm.sh --------------------------------------------------------------------------------