├── .gitignore ├── LICENSE ├── README.md ├── defaults.ini ├── example ├── V2A_sample-1.mp4 ├── V2A_sample-2.mp4 ├── V2A_sample-3.mp4 ├── V2M_sample-1.mp4 ├── V2M_sample-2.mp4 └── V2M_sample-3.mp4 ├── pyproject.toml ├── run_gradio.py ├── setup.py └── stable_audio_tools ├── __init__.py ├── data ├── __init__.py ├── dataset.py └── utils.py ├── inference ├── __init__.py ├── generation.py ├── sampling.py └── utils.py ├── interface ├── __init__.py └── gradio.py ├── models ├── __init__.py ├── adp.py ├── autoencoders.py ├── blocks.py ├── bottleneck.py ├── codebook_patterns.py ├── conditioners.py ├── diffusion.py ├── discriminators.py ├── dit.py ├── factory.py ├── lm.py ├── local_attention.py ├── pqmf.py ├── pretrained.py ├── pretransforms.py ├── temptransformer.py ├── transformer.py ├── utils.py └── wavelets.py └── training ├── __init__.py ├── autoencoders.py ├── diffusion.py ├── factory.py ├── lm.py ├── losses ├── __init__.py ├── auraloss.py └── losses.py └── utils.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/README.md -------------------------------------------------------------------------------- /defaults.ini: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/defaults.ini -------------------------------------------------------------------------------- /example/V2A_sample-1.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/example/V2A_sample-1.mp4 -------------------------------------------------------------------------------- /example/V2A_sample-2.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/example/V2A_sample-2.mp4 -------------------------------------------------------------------------------- /example/V2A_sample-3.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/example/V2A_sample-3.mp4 -------------------------------------------------------------------------------- /example/V2M_sample-1.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/example/V2M_sample-1.mp4 -------------------------------------------------------------------------------- /example/V2M_sample-2.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/example/V2M_sample-2.mp4 -------------------------------------------------------------------------------- /example/V2M_sample-3.mp4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/example/V2M_sample-3.mp4 -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/pyproject.toml -------------------------------------------------------------------------------- /run_gradio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/run_gradio.py -------------------------------------------------------------------------------- /setup.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/setup.py -------------------------------------------------------------------------------- /stable_audio_tools/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/__init__.py -------------------------------------------------------------------------------- /stable_audio_tools/data/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /stable_audio_tools/data/dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/data/dataset.py -------------------------------------------------------------------------------- /stable_audio_tools/data/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/data/utils.py -------------------------------------------------------------------------------- /stable_audio_tools/inference/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /stable_audio_tools/inference/generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/inference/generation.py -------------------------------------------------------------------------------- /stable_audio_tools/inference/sampling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/inference/sampling.py -------------------------------------------------------------------------------- /stable_audio_tools/inference/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/inference/utils.py -------------------------------------------------------------------------------- /stable_audio_tools/interface/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /stable_audio_tools/interface/gradio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/interface/gradio.py -------------------------------------------------------------------------------- /stable_audio_tools/models/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/__init__.py -------------------------------------------------------------------------------- /stable_audio_tools/models/adp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/adp.py -------------------------------------------------------------------------------- /stable_audio_tools/models/autoencoders.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/autoencoders.py -------------------------------------------------------------------------------- /stable_audio_tools/models/blocks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/blocks.py -------------------------------------------------------------------------------- /stable_audio_tools/models/bottleneck.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/bottleneck.py -------------------------------------------------------------------------------- /stable_audio_tools/models/codebook_patterns.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/codebook_patterns.py -------------------------------------------------------------------------------- /stable_audio_tools/models/conditioners.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/conditioners.py -------------------------------------------------------------------------------- /stable_audio_tools/models/diffusion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/diffusion.py -------------------------------------------------------------------------------- /stable_audio_tools/models/discriminators.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/discriminators.py -------------------------------------------------------------------------------- /stable_audio_tools/models/dit.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/dit.py -------------------------------------------------------------------------------- /stable_audio_tools/models/factory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/factory.py -------------------------------------------------------------------------------- /stable_audio_tools/models/lm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/lm.py -------------------------------------------------------------------------------- /stable_audio_tools/models/local_attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/local_attention.py -------------------------------------------------------------------------------- /stable_audio_tools/models/pqmf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/pqmf.py -------------------------------------------------------------------------------- /stable_audio_tools/models/pretrained.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/pretrained.py -------------------------------------------------------------------------------- /stable_audio_tools/models/pretransforms.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/pretransforms.py -------------------------------------------------------------------------------- /stable_audio_tools/models/temptransformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/temptransformer.py -------------------------------------------------------------------------------- /stable_audio_tools/models/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/transformer.py -------------------------------------------------------------------------------- /stable_audio_tools/models/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/utils.py -------------------------------------------------------------------------------- /stable_audio_tools/models/wavelets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/models/wavelets.py -------------------------------------------------------------------------------- /stable_audio_tools/training/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/training/__init__.py -------------------------------------------------------------------------------- /stable_audio_tools/training/autoencoders.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/training/autoencoders.py -------------------------------------------------------------------------------- /stable_audio_tools/training/diffusion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/training/diffusion.py -------------------------------------------------------------------------------- /stable_audio_tools/training/factory.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/training/factory.py -------------------------------------------------------------------------------- /stable_audio_tools/training/lm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/training/lm.py -------------------------------------------------------------------------------- /stable_audio_tools/training/losses/__init__.py: -------------------------------------------------------------------------------- 1 | from .losses import * -------------------------------------------------------------------------------- /stable_audio_tools/training/losses/auraloss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/training/losses/auraloss.py -------------------------------------------------------------------------------- /stable_audio_tools/training/losses/losses.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/training/losses/losses.py -------------------------------------------------------------------------------- /stable_audio_tools/training/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/ZeyueT/AudioX/HEAD/stable_audio_tools/training/utils.py --------------------------------------------------------------------------------