├── .gitignore ├── LICENSE ├── README.md ├── evaluate ├── compute_at_acc.py ├── compute_fense.py ├── compute_gender_acc.py ├── compute_map.py ├── compute_qa_acc.py ├── fense │ ├── __init__.py │ ├── data.py │ ├── download_utils.py │ ├── evaluator.py │ ├── fense.py │ └── model.py ├── jsonl │ ├── MiDashengLM_AutoACD.jsonl │ ├── MiDashengLM_FSD50K.jsonl │ ├── MiDashengLM_LibriSpeech_test-clean.jsonl │ ├── MiDashengLM_MuChoMusic.jsonl │ ├── MiDashengLM_MusicQA.jsonl │ ├── MiDashengLM_NSynth.jsonl │ └── MiDashengLM_VoxCeleb-Gender.jsonl ├── prompt.csv └── wer │ ├── cn_tn.py │ ├── compute_wer.py │ ├── evaluate_tokenizer.py │ └── whisper_normalizer │ ├── basic.py │ ├── english.json │ └── english.py ├── fig ├── Framework-1.png ├── Framework.pdf ├── acavcaps-1.png ├── acavcaps.pdf ├── batchsize_1_comparison_7b-1.png ├── batchsize_1_comparison_7b.pdf ├── capabilities_plot_7b-1.png ├── capabilities_plot_7b.pdf ├── convert_pdfs_to_pngs.sh ├── llm_training_loss-1.png ├── llm_training_loss.pdf ├── pretraining_sampling_rates-1.png └── pretraining_sampling_rates.pdf ├── mdl-toolkit ├── .gitignore ├── README.md ├── README_zh.md ├── docs_en │ ├── cli.md │ ├── distributed.md │ ├── esc-50.ipynb │ └── installation.md ├── docs_zh │ ├── cli.md │ ├── distributed.md │ ├── esc-50.ipynb │ └── installation.md ├── mdl_toolkit │ ├── __init__.py │ ├── cli.py │ ├── conversation.py │ ├── convert_dataset.py │ ├── inference.py │ └── train.py └── pyproject.toml ├── requirements.txt └── technical_report └── MiDashengLM_techreport.pdf /.gitignore: -------------------------------------------------------------------------------- 1 | __pycache__ 2 | res_* 3 | process.py 4 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/README.md -------------------------------------------------------------------------------- /evaluate/compute_at_acc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/compute_at_acc.py -------------------------------------------------------------------------------- /evaluate/compute_fense.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/compute_fense.py -------------------------------------------------------------------------------- /evaluate/compute_gender_acc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/compute_gender_acc.py -------------------------------------------------------------------------------- /evaluate/compute_map.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/compute_map.py -------------------------------------------------------------------------------- /evaluate/compute_qa_acc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/compute_qa_acc.py -------------------------------------------------------------------------------- /evaluate/fense/__init__.py: -------------------------------------------------------------------------------- 1 | __version__ = '0.1' -------------------------------------------------------------------------------- /evaluate/fense/data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/fense/data.py -------------------------------------------------------------------------------- /evaluate/fense/download_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/fense/download_utils.py -------------------------------------------------------------------------------- /evaluate/fense/evaluator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/fense/evaluator.py -------------------------------------------------------------------------------- /evaluate/fense/fense.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/fense/fense.py -------------------------------------------------------------------------------- /evaluate/fense/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/fense/model.py -------------------------------------------------------------------------------- /evaluate/jsonl/MiDashengLM_AutoACD.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/jsonl/MiDashengLM_AutoACD.jsonl -------------------------------------------------------------------------------- /evaluate/jsonl/MiDashengLM_FSD50K.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/jsonl/MiDashengLM_FSD50K.jsonl -------------------------------------------------------------------------------- /evaluate/jsonl/MiDashengLM_LibriSpeech_test-clean.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/jsonl/MiDashengLM_LibriSpeech_test-clean.jsonl -------------------------------------------------------------------------------- /evaluate/jsonl/MiDashengLM_MuChoMusic.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/jsonl/MiDashengLM_MuChoMusic.jsonl -------------------------------------------------------------------------------- /evaluate/jsonl/MiDashengLM_MusicQA.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/jsonl/MiDashengLM_MusicQA.jsonl -------------------------------------------------------------------------------- /evaluate/jsonl/MiDashengLM_NSynth.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/jsonl/MiDashengLM_NSynth.jsonl -------------------------------------------------------------------------------- /evaluate/jsonl/MiDashengLM_VoxCeleb-Gender.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/jsonl/MiDashengLM_VoxCeleb-Gender.jsonl -------------------------------------------------------------------------------- /evaluate/prompt.csv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/prompt.csv -------------------------------------------------------------------------------- /evaluate/wer/cn_tn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/wer/cn_tn.py -------------------------------------------------------------------------------- /evaluate/wer/compute_wer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/wer/compute_wer.py -------------------------------------------------------------------------------- /evaluate/wer/evaluate_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/wer/evaluate_tokenizer.py -------------------------------------------------------------------------------- /evaluate/wer/whisper_normalizer/basic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/wer/whisper_normalizer/basic.py -------------------------------------------------------------------------------- /evaluate/wer/whisper_normalizer/english.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/wer/whisper_normalizer/english.json -------------------------------------------------------------------------------- /evaluate/wer/whisper_normalizer/english.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/wer/whisper_normalizer/english.py -------------------------------------------------------------------------------- /fig/Framework-1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/Framework-1.png -------------------------------------------------------------------------------- /fig/Framework.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/Framework.pdf -------------------------------------------------------------------------------- /fig/acavcaps-1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/acavcaps-1.png -------------------------------------------------------------------------------- /fig/acavcaps.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/acavcaps.pdf -------------------------------------------------------------------------------- /fig/batchsize_1_comparison_7b-1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/batchsize_1_comparison_7b-1.png -------------------------------------------------------------------------------- /fig/batchsize_1_comparison_7b.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/batchsize_1_comparison_7b.pdf -------------------------------------------------------------------------------- /fig/capabilities_plot_7b-1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/capabilities_plot_7b-1.png -------------------------------------------------------------------------------- /fig/capabilities_plot_7b.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/capabilities_plot_7b.pdf -------------------------------------------------------------------------------- /fig/convert_pdfs_to_pngs.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/convert_pdfs_to_pngs.sh -------------------------------------------------------------------------------- /fig/llm_training_loss-1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/llm_training_loss-1.png -------------------------------------------------------------------------------- /fig/llm_training_loss.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/llm_training_loss.pdf -------------------------------------------------------------------------------- /fig/pretraining_sampling_rates-1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/pretraining_sampling_rates-1.png -------------------------------------------------------------------------------- /fig/pretraining_sampling_rates.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/pretraining_sampling_rates.pdf -------------------------------------------------------------------------------- /mdl-toolkit/.gitignore: -------------------------------------------------------------------------------- 1 | __pycache__ 2 | uv.lock 3 | *.egg-info/ 4 | build/ 5 | dist/ 6 | -------------------------------------------------------------------------------- /mdl-toolkit/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/README.md -------------------------------------------------------------------------------- /mdl-toolkit/README_zh.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/README_zh.md -------------------------------------------------------------------------------- /mdl-toolkit/docs_en/cli.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/docs_en/cli.md -------------------------------------------------------------------------------- /mdl-toolkit/docs_en/distributed.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/docs_en/distributed.md -------------------------------------------------------------------------------- /mdl-toolkit/docs_en/esc-50.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/docs_en/esc-50.ipynb -------------------------------------------------------------------------------- /mdl-toolkit/docs_en/installation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/docs_en/installation.md -------------------------------------------------------------------------------- /mdl-toolkit/docs_zh/cli.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/docs_zh/cli.md -------------------------------------------------------------------------------- /mdl-toolkit/docs_zh/distributed.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/docs_zh/distributed.md -------------------------------------------------------------------------------- /mdl-toolkit/docs_zh/esc-50.ipynb: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/docs_zh/esc-50.ipynb -------------------------------------------------------------------------------- /mdl-toolkit/docs_zh/installation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/docs_zh/installation.md -------------------------------------------------------------------------------- /mdl-toolkit/mdl_toolkit/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /mdl-toolkit/mdl_toolkit/cli.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/mdl_toolkit/cli.py -------------------------------------------------------------------------------- /mdl-toolkit/mdl_toolkit/conversation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/mdl_toolkit/conversation.py -------------------------------------------------------------------------------- /mdl-toolkit/mdl_toolkit/convert_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/mdl_toolkit/convert_dataset.py -------------------------------------------------------------------------------- /mdl-toolkit/mdl_toolkit/inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/mdl_toolkit/inference.py -------------------------------------------------------------------------------- /mdl-toolkit/mdl_toolkit/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/mdl_toolkit/train.py -------------------------------------------------------------------------------- /mdl-toolkit/pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/pyproject.toml -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/requirements.txt -------------------------------------------------------------------------------- /technical_report/MiDashengLM_techreport.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/technical_report/MiDashengLM_techreport.pdf --------------------------------------------------------------------------------