├── License.txt ├── README.md ├── assets ├── answer.wav ├── asr_res.png ├── latency.png ├── logo.png ├── out_cer.png ├── overview.png ├── qa.png ├── question.wav ├── system.png └── wechat_code.jpg ├── bin ├── inference.py └── server.py ├── models ├── adapter.py ├── audioLLM.py ├── decoder │ ├── decoder.py │ ├── llm2tts.py │ └── ticodec │ │ ├── models.py │ │ ├── vqvae.py │ │ └── vqvae_tester.py ├── encoder │ ├── attention.py │ ├── cmvn.py │ ├── encoder.py │ ├── subsampling.py │ └── transformer.py ├── masks.py ├── pipeline.py └── utils.py ├── requirements.txt ├── scripts ├── run_demo_server.sh └── run_inference.sh └── web ├── parms.py ├── pem.py ├── pool.py ├── queue.py ├── resources └── demo.html └── vad.py /License.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/License.txt -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/README.md -------------------------------------------------------------------------------- /assets/answer.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/assets/answer.wav -------------------------------------------------------------------------------- /assets/asr_res.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/assets/asr_res.png -------------------------------------------------------------------------------- /assets/latency.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/assets/latency.png -------------------------------------------------------------------------------- /assets/logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/assets/logo.png -------------------------------------------------------------------------------- /assets/out_cer.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/assets/out_cer.png -------------------------------------------------------------------------------- /assets/overview.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/assets/overview.png -------------------------------------------------------------------------------- /assets/qa.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/assets/qa.png -------------------------------------------------------------------------------- /assets/question.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/assets/question.wav -------------------------------------------------------------------------------- /assets/system.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/assets/system.png -------------------------------------------------------------------------------- /assets/wechat_code.jpg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/assets/wechat_code.jpg -------------------------------------------------------------------------------- /bin/inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/bin/inference.py -------------------------------------------------------------------------------- /bin/server.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/bin/server.py -------------------------------------------------------------------------------- /models/adapter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/models/adapter.py -------------------------------------------------------------------------------- /models/audioLLM.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/models/audioLLM.py -------------------------------------------------------------------------------- /models/decoder/decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/models/decoder/decoder.py -------------------------------------------------------------------------------- /models/decoder/llm2tts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/models/decoder/llm2tts.py -------------------------------------------------------------------------------- /models/decoder/ticodec/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/models/decoder/ticodec/models.py -------------------------------------------------------------------------------- /models/decoder/ticodec/vqvae.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/models/decoder/ticodec/vqvae.py -------------------------------------------------------------------------------- /models/decoder/ticodec/vqvae_tester.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/models/decoder/ticodec/vqvae_tester.py -------------------------------------------------------------------------------- /models/encoder/attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/models/encoder/attention.py -------------------------------------------------------------------------------- /models/encoder/cmvn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/models/encoder/cmvn.py -------------------------------------------------------------------------------- /models/encoder/encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/models/encoder/encoder.py -------------------------------------------------------------------------------- /models/encoder/subsampling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/models/encoder/subsampling.py -------------------------------------------------------------------------------- /models/encoder/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/models/encoder/transformer.py -------------------------------------------------------------------------------- /models/masks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/models/masks.py -------------------------------------------------------------------------------- /models/pipeline.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/models/pipeline.py -------------------------------------------------------------------------------- /models/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/models/utils.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/requirements.txt -------------------------------------------------------------------------------- /scripts/run_demo_server.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/scripts/run_demo_server.sh -------------------------------------------------------------------------------- /scripts/run_inference.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/scripts/run_inference.sh -------------------------------------------------------------------------------- /web/parms.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/web/parms.py -------------------------------------------------------------------------------- /web/pem.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/web/pem.py -------------------------------------------------------------------------------- /web/pool.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/web/pool.py -------------------------------------------------------------------------------- /web/queue.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/web/queue.py -------------------------------------------------------------------------------- /web/resources/demo.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/web/resources/demo.html -------------------------------------------------------------------------------- /web/vad.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/VITA-MLLM/Freeze-Omni/HEAD/web/vad.py --------------------------------------------------------------------------------