├── .gitignore
├── LICENSE
├── README.md
├── evaluate
    ├── compute_at_acc.py
    ├── compute_fense.py
    ├── compute_gender_acc.py
    ├── compute_map.py
    ├── compute_qa_acc.py
    ├── fense
    │   ├── __init__.py
    │   ├── data.py
    │   ├── download_utils.py
    │   ├── evaluator.py
    │   ├── fense.py
    │   └── model.py
    ├── jsonl
    │   ├── MiDashengLM_AutoACD.jsonl
    │   ├── MiDashengLM_FSD50K.jsonl
    │   ├── MiDashengLM_LibriSpeech_test-clean.jsonl
    │   ├── MiDashengLM_MuChoMusic.jsonl
    │   ├── MiDashengLM_MusicQA.jsonl
    │   ├── MiDashengLM_NSynth.jsonl
    │   └── MiDashengLM_VoxCeleb-Gender.jsonl
    ├── prompt.csv
    └── wer
    │   ├── cn_tn.py
    │   ├── compute_wer.py
    │   ├── evaluate_tokenizer.py
    │   └── whisper_normalizer
    │       ├── basic.py
    │       ├── english.json
    │       └── english.py
├── fig
    ├── Framework-1.png
    ├── Framework.pdf
    ├── acavcaps-1.png
    ├── acavcaps.pdf
    ├── batchsize_1_comparison_7b-1.png
    ├── batchsize_1_comparison_7b.pdf
    ├── capabilities_plot_7b-1.png
    ├── capabilities_plot_7b.pdf
    ├── convert_pdfs_to_pngs.sh
    ├── llm_training_loss-1.png
    ├── llm_training_loss.pdf
    ├── pretraining_sampling_rates-1.png
    └── pretraining_sampling_rates.pdf
├── mdl-toolkit
    ├── .gitignore
    ├── README.md
    ├── README_zh.md
    ├── docs_en
    │   ├── cli.md
    │   ├── distributed.md
    │   ├── esc-50.ipynb
    │   └── installation.md
    ├── docs_zh
    │   ├── cli.md
    │   ├── distributed.md
    │   ├── esc-50.ipynb
    │   └── installation.md
    ├── mdl_toolkit
    │   ├── __init__.py
    │   ├── cli.py
    │   ├── conversation.py
    │   ├── convert_dataset.py
    │   ├── inference.py
    │   └── train.py
    └── pyproject.toml
├── requirements.txt
└── technical_report
    └── MiDashengLM_techreport.pdf


/.gitignore:
--------------------------------------------------------------------------------
1 | __pycache__
2 | res_*
3 | process.py
4 | 


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/LICENSE


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/README.md


--------------------------------------------------------------------------------
/evaluate/compute_at_acc.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/compute_at_acc.py


--------------------------------------------------------------------------------
/evaluate/compute_fense.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/compute_fense.py


--------------------------------------------------------------------------------
/evaluate/compute_gender_acc.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/compute_gender_acc.py


--------------------------------------------------------------------------------
/evaluate/compute_map.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/compute_map.py


--------------------------------------------------------------------------------
/evaluate/compute_qa_acc.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/compute_qa_acc.py


--------------------------------------------------------------------------------
/evaluate/fense/__init__.py:
--------------------------------------------------------------------------------
1 | __version__ = '0.1'


--------------------------------------------------------------------------------
/evaluate/fense/data.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/fense/data.py


--------------------------------------------------------------------------------
/evaluate/fense/download_utils.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/fense/download_utils.py


--------------------------------------------------------------------------------
/evaluate/fense/evaluator.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/fense/evaluator.py


--------------------------------------------------------------------------------
/evaluate/fense/fense.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/fense/fense.py


--------------------------------------------------------------------------------
/evaluate/fense/model.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/fense/model.py


--------------------------------------------------------------------------------
/evaluate/jsonl/MiDashengLM_AutoACD.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/jsonl/MiDashengLM_AutoACD.jsonl


--------------------------------------------------------------------------------
/evaluate/jsonl/MiDashengLM_FSD50K.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/jsonl/MiDashengLM_FSD50K.jsonl


--------------------------------------------------------------------------------
/evaluate/jsonl/MiDashengLM_LibriSpeech_test-clean.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/jsonl/MiDashengLM_LibriSpeech_test-clean.jsonl


--------------------------------------------------------------------------------
/evaluate/jsonl/MiDashengLM_MuChoMusic.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/jsonl/MiDashengLM_MuChoMusic.jsonl


--------------------------------------------------------------------------------
/evaluate/jsonl/MiDashengLM_MusicQA.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/jsonl/MiDashengLM_MusicQA.jsonl


--------------------------------------------------------------------------------
/evaluate/jsonl/MiDashengLM_NSynth.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/jsonl/MiDashengLM_NSynth.jsonl


--------------------------------------------------------------------------------
/evaluate/jsonl/MiDashengLM_VoxCeleb-Gender.jsonl:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/jsonl/MiDashengLM_VoxCeleb-Gender.jsonl


--------------------------------------------------------------------------------
/evaluate/prompt.csv:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/prompt.csv


--------------------------------------------------------------------------------
/evaluate/wer/cn_tn.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/wer/cn_tn.py


--------------------------------------------------------------------------------
/evaluate/wer/compute_wer.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/wer/compute_wer.py


--------------------------------------------------------------------------------
/evaluate/wer/evaluate_tokenizer.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/wer/evaluate_tokenizer.py


--------------------------------------------------------------------------------
/evaluate/wer/whisper_normalizer/basic.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/wer/whisper_normalizer/basic.py


--------------------------------------------------------------------------------
/evaluate/wer/whisper_normalizer/english.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/wer/whisper_normalizer/english.json


--------------------------------------------------------------------------------
/evaluate/wer/whisper_normalizer/english.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/evaluate/wer/whisper_normalizer/english.py


--------------------------------------------------------------------------------
/fig/Framework-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/Framework-1.png


--------------------------------------------------------------------------------
/fig/Framework.pdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/Framework.pdf


--------------------------------------------------------------------------------
/fig/acavcaps-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/acavcaps-1.png


--------------------------------------------------------------------------------
/fig/acavcaps.pdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/acavcaps.pdf


--------------------------------------------------------------------------------
/fig/batchsize_1_comparison_7b-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/batchsize_1_comparison_7b-1.png


--------------------------------------------------------------------------------
/fig/batchsize_1_comparison_7b.pdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/batchsize_1_comparison_7b.pdf


--------------------------------------------------------------------------------
/fig/capabilities_plot_7b-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/capabilities_plot_7b-1.png


--------------------------------------------------------------------------------
/fig/capabilities_plot_7b.pdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/capabilities_plot_7b.pdf


--------------------------------------------------------------------------------
/fig/convert_pdfs_to_pngs.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/convert_pdfs_to_pngs.sh


--------------------------------------------------------------------------------
/fig/llm_training_loss-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/llm_training_loss-1.png


--------------------------------------------------------------------------------
/fig/llm_training_loss.pdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/llm_training_loss.pdf


--------------------------------------------------------------------------------
/fig/pretraining_sampling_rates-1.png:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/pretraining_sampling_rates-1.png


--------------------------------------------------------------------------------
/fig/pretraining_sampling_rates.pdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/fig/pretraining_sampling_rates.pdf


--------------------------------------------------------------------------------
/mdl-toolkit/.gitignore:
--------------------------------------------------------------------------------
1 | __pycache__
2 | uv.lock
3 | *.egg-info/
4 | build/
5 | dist/
6 | 


--------------------------------------------------------------------------------
/mdl-toolkit/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/README.md


--------------------------------------------------------------------------------
/mdl-toolkit/README_zh.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/README_zh.md


--------------------------------------------------------------------------------
/mdl-toolkit/docs_en/cli.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/docs_en/cli.md


--------------------------------------------------------------------------------
/mdl-toolkit/docs_en/distributed.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/docs_en/distributed.md


--------------------------------------------------------------------------------
/mdl-toolkit/docs_en/esc-50.ipynb:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/docs_en/esc-50.ipynb


--------------------------------------------------------------------------------
/mdl-toolkit/docs_en/installation.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/docs_en/installation.md


--------------------------------------------------------------------------------
/mdl-toolkit/docs_zh/cli.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/docs_zh/cli.md


--------------------------------------------------------------------------------
/mdl-toolkit/docs_zh/distributed.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/docs_zh/distributed.md


--------------------------------------------------------------------------------
/mdl-toolkit/docs_zh/esc-50.ipynb:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/docs_zh/esc-50.ipynb


--------------------------------------------------------------------------------
/mdl-toolkit/docs_zh/installation.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/docs_zh/installation.md


--------------------------------------------------------------------------------
/mdl-toolkit/mdl_toolkit/__init__.py:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/mdl-toolkit/mdl_toolkit/cli.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/mdl_toolkit/cli.py


--------------------------------------------------------------------------------
/mdl-toolkit/mdl_toolkit/conversation.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/mdl_toolkit/conversation.py


--------------------------------------------------------------------------------
/mdl-toolkit/mdl_toolkit/convert_dataset.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/mdl_toolkit/convert_dataset.py


--------------------------------------------------------------------------------
/mdl-toolkit/mdl_toolkit/inference.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/mdl_toolkit/inference.py


--------------------------------------------------------------------------------
/mdl-toolkit/mdl_toolkit/train.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/mdl_toolkit/train.py


--------------------------------------------------------------------------------
/mdl-toolkit/pyproject.toml:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/mdl-toolkit/pyproject.toml


--------------------------------------------------------------------------------
/requirements.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/requirements.txt


--------------------------------------------------------------------------------
/technical_report/MiDashengLM_techreport.pdf:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/xiaomi-research/dasheng-lm/HEAD/technical_report/MiDashengLM_techreport.pdf


--------------------------------------------------------------------------------