├── .envrc ├── .github ├── pull_request_template.md └── workflows │ └── linter.yaml ├── .gitignore ├── .pre-commit-config.yaml ├── .tool-versions ├── CONTRIBUTING.md ├── LICENSE ├── Makefile ├── README.md ├── example ├── codec │ └── model_config.json └── configs │ ├── codec_training_config.json │ ├── rlhf.json │ ├── samples.jsonl │ └── sft.json ├── pyproject.toml ├── setup └── setup_python.sh ├── tools ├── data │ ├── data_merger.py │ └── data_vectorizer.py └── serving │ ├── convert_checkpoint.py │ └── inference.py ├── tts ├── __init__.py ├── core │ ├── codec │ │ ├── activations.py │ │ ├── criterion.py │ │ ├── decoder.py │ │ ├── decoder_modules.py │ │ ├── decoding.py │ │ ├── discriminator.py │ │ ├── encoder.py │ │ ├── encoder_modules.py │ │ ├── encoding.py │ │ ├── filters.py │ │ └── upsampler.py │ ├── constants.py │ ├── lora.py │ ├── modeling.py │ ├── optimization.py │ ├── prompting.py │ └── tokenization.py ├── data │ ├── caching.py │ ├── data_sample.py │ ├── data_utils.py │ ├── datasets │ │ ├── finetuning.py │ │ ├── pretraining.py │ │ └── rlhf.py │ ├── filtering.py │ ├── text_normalization.py │ └── tts_datasets.py ├── inference │ ├── inferencing.py │ └── quality_validation.py ├── training │ ├── checkpointing.py │ ├── codec │ │ ├── codec_datasets.py │ │ ├── codec_quality_validation.py │ │ ├── gan_training_loop.py │ │ └── train_codec.py │ ├── environment.py │ ├── evaluation.py │ ├── main.py │ ├── rlhf │ │ ├── ecapa_tdnn.py │ │ ├── reward_utils.py │ │ ├── rewards.py │ │ ├── rlhf_main.py │ │ └── run_rlhf_combine.sh │ └── training_loop.py └── utils │ ├── configuration.py │ └── custom_logging.py └── uv.lock /.envrc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/.envrc -------------------------------------------------------------------------------- /.github/pull_request_template.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/.github/pull_request_template.md -------------------------------------------------------------------------------- /.github/workflows/linter.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/.github/workflows/linter.yaml -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/.gitignore -------------------------------------------------------------------------------- /.pre-commit-config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/.pre-commit-config.yaml -------------------------------------------------------------------------------- /.tool-versions: -------------------------------------------------------------------------------- 1 | python 3.10.12 2 | uv 0.6.9 3 | -------------------------------------------------------------------------------- /CONTRIBUTING.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/CONTRIBUTING.md -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/LICENSE -------------------------------------------------------------------------------- /Makefile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/Makefile -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/README.md -------------------------------------------------------------------------------- /example/codec/model_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/example/codec/model_config.json -------------------------------------------------------------------------------- /example/configs/codec_training_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/example/configs/codec_training_config.json -------------------------------------------------------------------------------- /example/configs/rlhf.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/example/configs/rlhf.json -------------------------------------------------------------------------------- /example/configs/samples.jsonl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/example/configs/samples.jsonl -------------------------------------------------------------------------------- /example/configs/sft.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/example/configs/sft.json -------------------------------------------------------------------------------- /pyproject.toml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/pyproject.toml -------------------------------------------------------------------------------- /setup/setup_python.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/setup/setup_python.sh -------------------------------------------------------------------------------- /tools/data/data_merger.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tools/data/data_merger.py -------------------------------------------------------------------------------- /tools/data/data_vectorizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tools/data/data_vectorizer.py -------------------------------------------------------------------------------- /tools/serving/convert_checkpoint.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tools/serving/convert_checkpoint.py -------------------------------------------------------------------------------- /tools/serving/inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tools/serving/inference.py -------------------------------------------------------------------------------- /tts/__init__.py: -------------------------------------------------------------------------------- 1 | __version__ = "0.0.1" 2 | -------------------------------------------------------------------------------- /tts/core/codec/activations.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/core/codec/activations.py -------------------------------------------------------------------------------- /tts/core/codec/criterion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/core/codec/criterion.py -------------------------------------------------------------------------------- /tts/core/codec/decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/core/codec/decoder.py -------------------------------------------------------------------------------- /tts/core/codec/decoder_modules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/core/codec/decoder_modules.py -------------------------------------------------------------------------------- /tts/core/codec/decoding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/core/codec/decoding.py -------------------------------------------------------------------------------- /tts/core/codec/discriminator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/core/codec/discriminator.py -------------------------------------------------------------------------------- /tts/core/codec/encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/core/codec/encoder.py -------------------------------------------------------------------------------- /tts/core/codec/encoder_modules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/core/codec/encoder_modules.py -------------------------------------------------------------------------------- /tts/core/codec/encoding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/core/codec/encoding.py -------------------------------------------------------------------------------- /tts/core/codec/filters.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/core/codec/filters.py -------------------------------------------------------------------------------- /tts/core/codec/upsampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/core/codec/upsampler.py -------------------------------------------------------------------------------- /tts/core/constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/core/constants.py -------------------------------------------------------------------------------- /tts/core/lora.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/core/lora.py -------------------------------------------------------------------------------- /tts/core/modeling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/core/modeling.py -------------------------------------------------------------------------------- /tts/core/optimization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/core/optimization.py -------------------------------------------------------------------------------- /tts/core/prompting.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/core/prompting.py -------------------------------------------------------------------------------- /tts/core/tokenization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/core/tokenization.py -------------------------------------------------------------------------------- /tts/data/caching.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/data/caching.py -------------------------------------------------------------------------------- /tts/data/data_sample.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/data/data_sample.py -------------------------------------------------------------------------------- /tts/data/data_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/data/data_utils.py -------------------------------------------------------------------------------- /tts/data/datasets/finetuning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/data/datasets/finetuning.py -------------------------------------------------------------------------------- /tts/data/datasets/pretraining.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/data/datasets/pretraining.py -------------------------------------------------------------------------------- /tts/data/datasets/rlhf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/data/datasets/rlhf.py -------------------------------------------------------------------------------- /tts/data/filtering.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/data/filtering.py -------------------------------------------------------------------------------- /tts/data/text_normalization.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/data/text_normalization.py -------------------------------------------------------------------------------- /tts/data/tts_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/data/tts_datasets.py -------------------------------------------------------------------------------- /tts/inference/inferencing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/inference/inferencing.py -------------------------------------------------------------------------------- /tts/inference/quality_validation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/inference/quality_validation.py -------------------------------------------------------------------------------- /tts/training/checkpointing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/training/checkpointing.py -------------------------------------------------------------------------------- /tts/training/codec/codec_datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/training/codec/codec_datasets.py -------------------------------------------------------------------------------- /tts/training/codec/codec_quality_validation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/training/codec/codec_quality_validation.py -------------------------------------------------------------------------------- /tts/training/codec/gan_training_loop.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/training/codec/gan_training_loop.py -------------------------------------------------------------------------------- /tts/training/codec/train_codec.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/training/codec/train_codec.py -------------------------------------------------------------------------------- /tts/training/environment.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/training/environment.py -------------------------------------------------------------------------------- /tts/training/evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/training/evaluation.py -------------------------------------------------------------------------------- /tts/training/main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/training/main.py -------------------------------------------------------------------------------- /tts/training/rlhf/ecapa_tdnn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/training/rlhf/ecapa_tdnn.py -------------------------------------------------------------------------------- /tts/training/rlhf/reward_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/training/rlhf/reward_utils.py -------------------------------------------------------------------------------- /tts/training/rlhf/rewards.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/training/rlhf/rewards.py -------------------------------------------------------------------------------- /tts/training/rlhf/rlhf_main.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/training/rlhf/rlhf_main.py -------------------------------------------------------------------------------- /tts/training/rlhf/run_rlhf_combine.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/training/rlhf/run_rlhf_combine.sh -------------------------------------------------------------------------------- /tts/training/training_loop.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/training/training_loop.py -------------------------------------------------------------------------------- /tts/utils/configuration.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/utils/configuration.py -------------------------------------------------------------------------------- /tts/utils/custom_logging.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/tts/utils/custom_logging.py -------------------------------------------------------------------------------- /uv.lock: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/inworld-ai/tts/HEAD/uv.lock --------------------------------------------------------------------------------