├── .gitignore ├── LICENSE ├── README.md ├── audio ├── __init__.py ├── audio_processing.py ├── stft.py └── tools.py ├── config └── LibriTTS │ ├── model.yaml │ ├── preprocess.yaml │ └── train.yaml ├── dataset.py ├── demo └── LibriTTS │ ├── references │ ├── 0_19_198_000000_000000.lab │ ├── 0_19_198_000000_000000.wav │ ├── 1_26_495_000004_000000.lab │ ├── 1_26_495_000004_000000.wav │ ├── 2_27_123349_000001_000000.lab │ ├── 2_27_123349_000001_000000.wav │ ├── 3_32_4137_000005_000001.lab │ ├── 3_32_4137_000005_000001.wav │ ├── 4_39_121916_000015_000005.lab │ ├── 4_39_121916_000015_000005.wav │ ├── 5_40_222_000001_000000.lab │ └── 5_40_222_000001_000000.wav │ └── results │ ├── 0_the two children therefore got up, dressed themselves quickly, and went away..png │ ├── 0_the two children therefore got up, dressed themselves quickly, and went away..wav │ ├── 1_the two children therefore got up, dressed themselves quickly, and went away..png │ ├── 1_the two children therefore got up, dressed themselves quickly, and went away..wav │ ├── 2_the two children therefore got up, dressed themselves quickly, and went away..png │ ├── 2_the two children therefore got up, dressed themselves quickly, and went away..wav │ ├── 3_the two children therefore got up, dressed themselves quickly, and went away..png │ ├── 3_the two children therefore got up, dressed themselves quickly, and went away..wav │ ├── 4_the two children therefore got up, dressed themselves quickly, and went away..png │ ├── 4_the two children therefore got up, dressed themselves quickly, and went away..wav │ ├── 5_the two children therefore got up, dressed themselves quickly, and went away..png │ └── 5_the two children therefore got up, dressed themselves quickly, and went away..wav ├── evaluate.py ├── filelist_filtering.py ├── hifigan ├── LICENSE ├── __init__.py ├── config.json ├── generator_LJSpeech.pth.tar.zip ├── generator_universal.pth.tar.zip └── models.py ├── img ├── model_1.png ├── model_2.png ├── tensorboard_audio.png ├── tensorboard_loss.png └── tensorboard_spec.png ├── lexicon ├── librispeech-lexicon.txt └── pinyin-lexicon-r.txt ├── model ├── StyleSpeech.py ├── __init__.py ├── blocks.py ├── loss.py ├── modules.py └── optimizer.py ├── prepare_align.py ├── preprocess.py ├── preprocessed_data └── LibriTTS │ ├── speakers.json │ ├── stats.json │ ├── train.txt │ ├── train_filtered.txt │ └── val.txt ├── preprocessor ├── aishell3.py ├── libritts.py ├── ljspeech.py └── preprocessor.py ├── requirements.txt ├── synthesize.py ├── text ├── __init__.py ├── cleaners.py ├── cmudict.py ├── numbers.py ├── pinyin.py └── symbols.py ├── train.py └── utils ├── model.py └── tools.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/README.md -------------------------------------------------------------------------------- /audio/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/audio/__init__.py -------------------------------------------------------------------------------- /audio/audio_processing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/audio/audio_processing.py -------------------------------------------------------------------------------- /audio/stft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/audio/stft.py -------------------------------------------------------------------------------- /audio/tools.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/audio/tools.py -------------------------------------------------------------------------------- /config/LibriTTS/model.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/config/LibriTTS/model.yaml -------------------------------------------------------------------------------- /config/LibriTTS/preprocess.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/config/LibriTTS/preprocess.yaml -------------------------------------------------------------------------------- /config/LibriTTS/train.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/config/LibriTTS/train.yaml -------------------------------------------------------------------------------- /dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/dataset.py -------------------------------------------------------------------------------- /demo/LibriTTS/references/0_19_198_000000_000000.lab: -------------------------------------------------------------------------------- 1 | this is a librivox recording. -------------------------------------------------------------------------------- /demo/LibriTTS/references/0_19_198_000000_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/references/0_19_198_000000_000000.wav -------------------------------------------------------------------------------- /demo/LibriTTS/references/1_26_495_000004_000000.lab: -------------------------------------------------------------------------------- 1 | by daniel defoe -------------------------------------------------------------------------------- /demo/LibriTTS/references/1_26_495_000004_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/references/1_26_495_000004_000000.wav -------------------------------------------------------------------------------- /demo/LibriTTS/references/2_27_123349_000001_000000.lab: -------------------------------------------------------------------------------- 1 | at length all differences were compromised. -------------------------------------------------------------------------------- /demo/LibriTTS/references/2_27_123349_000001_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/references/2_27_123349_000001_000000.wav -------------------------------------------------------------------------------- /demo/LibriTTS/references/3_32_4137_000005_000001.lab: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/references/3_32_4137_000005_000001.lab -------------------------------------------------------------------------------- /demo/LibriTTS/references/3_32_4137_000005_000001.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/references/3_32_4137_000005_000001.wav -------------------------------------------------------------------------------- /demo/LibriTTS/references/4_39_121916_000015_000005.lab: -------------------------------------------------------------------------------- 1 | ours are all apple tarts. -------------------------------------------------------------------------------- /demo/LibriTTS/references/4_39_121916_000015_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/references/4_39_121916_000015_000005.wav -------------------------------------------------------------------------------- /demo/LibriTTS/references/5_40_222_000001_000000.lab: -------------------------------------------------------------------------------- 1 | chapter twenty five -------------------------------------------------------------------------------- /demo/LibriTTS/references/5_40_222_000001_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/references/5_40_222_000001_000000.wav -------------------------------------------------------------------------------- /demo/LibriTTS/results/0_the two children therefore got up, dressed themselves quickly, and went away..png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/results/0_the two children therefore got up, dressed themselves quickly, and went away..png -------------------------------------------------------------------------------- /demo/LibriTTS/results/0_the two children therefore got up, dressed themselves quickly, and went away..wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/results/0_the two children therefore got up, dressed themselves quickly, and went away..wav -------------------------------------------------------------------------------- /demo/LibriTTS/results/1_the two children therefore got up, dressed themselves quickly, and went away..png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/results/1_the two children therefore got up, dressed themselves quickly, and went away..png -------------------------------------------------------------------------------- /demo/LibriTTS/results/1_the two children therefore got up, dressed themselves quickly, and went away..wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/results/1_the two children therefore got up, dressed themselves quickly, and went away..wav -------------------------------------------------------------------------------- /demo/LibriTTS/results/2_the two children therefore got up, dressed themselves quickly, and went away..png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/results/2_the two children therefore got up, dressed themselves quickly, and went away..png -------------------------------------------------------------------------------- /demo/LibriTTS/results/2_the two children therefore got up, dressed themselves quickly, and went away..wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/results/2_the two children therefore got up, dressed themselves quickly, and went away..wav -------------------------------------------------------------------------------- /demo/LibriTTS/results/3_the two children therefore got up, dressed themselves quickly, and went away..png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/results/3_the two children therefore got up, dressed themselves quickly, and went away..png -------------------------------------------------------------------------------- /demo/LibriTTS/results/3_the two children therefore got up, dressed themselves quickly, and went away..wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/results/3_the two children therefore got up, dressed themselves quickly, and went away..wav -------------------------------------------------------------------------------- /demo/LibriTTS/results/4_the two children therefore got up, dressed themselves quickly, and went away..png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/results/4_the two children therefore got up, dressed themselves quickly, and went away..png -------------------------------------------------------------------------------- /demo/LibriTTS/results/4_the two children therefore got up, dressed themselves quickly, and went away..wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/results/4_the two children therefore got up, dressed themselves quickly, and went away..wav -------------------------------------------------------------------------------- /demo/LibriTTS/results/5_the two children therefore got up, dressed themselves quickly, and went away..png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/results/5_the two children therefore got up, dressed themselves quickly, and went away..png -------------------------------------------------------------------------------- /demo/LibriTTS/results/5_the two children therefore got up, dressed themselves quickly, and went away..wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/demo/LibriTTS/results/5_the two children therefore got up, dressed themselves quickly, and went away..wav -------------------------------------------------------------------------------- /evaluate.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/evaluate.py -------------------------------------------------------------------------------- /filelist_filtering.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/filelist_filtering.py -------------------------------------------------------------------------------- /hifigan/LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/hifigan/LICENSE -------------------------------------------------------------------------------- /hifigan/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/hifigan/__init__.py -------------------------------------------------------------------------------- /hifigan/config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/hifigan/config.json -------------------------------------------------------------------------------- /hifigan/generator_LJSpeech.pth.tar.zip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/hifigan/generator_LJSpeech.pth.tar.zip -------------------------------------------------------------------------------- /hifigan/generator_universal.pth.tar.zip: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/hifigan/generator_universal.pth.tar.zip -------------------------------------------------------------------------------- /hifigan/models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/hifigan/models.py -------------------------------------------------------------------------------- /img/model_1.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/img/model_1.png -------------------------------------------------------------------------------- /img/model_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/img/model_2.png -------------------------------------------------------------------------------- /img/tensorboard_audio.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/img/tensorboard_audio.png -------------------------------------------------------------------------------- /img/tensorboard_loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/img/tensorboard_loss.png -------------------------------------------------------------------------------- /img/tensorboard_spec.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/img/tensorboard_spec.png -------------------------------------------------------------------------------- /lexicon/librispeech-lexicon.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/lexicon/librispeech-lexicon.txt -------------------------------------------------------------------------------- /lexicon/pinyin-lexicon-r.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/lexicon/pinyin-lexicon-r.txt -------------------------------------------------------------------------------- /model/StyleSpeech.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/model/StyleSpeech.py -------------------------------------------------------------------------------- /model/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/model/__init__.py -------------------------------------------------------------------------------- /model/blocks.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/model/blocks.py -------------------------------------------------------------------------------- /model/loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/model/loss.py -------------------------------------------------------------------------------- /model/modules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/model/modules.py -------------------------------------------------------------------------------- /model/optimizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/model/optimizer.py -------------------------------------------------------------------------------- /prepare_align.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/prepare_align.py -------------------------------------------------------------------------------- /preprocess.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/preprocess.py -------------------------------------------------------------------------------- /preprocessed_data/LibriTTS/speakers.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/preprocessed_data/LibriTTS/speakers.json -------------------------------------------------------------------------------- /preprocessed_data/LibriTTS/stats.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/preprocessed_data/LibriTTS/stats.json -------------------------------------------------------------------------------- /preprocessed_data/LibriTTS/train.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/preprocessed_data/LibriTTS/train.txt -------------------------------------------------------------------------------- /preprocessed_data/LibriTTS/train_filtered.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/preprocessed_data/LibriTTS/train_filtered.txt -------------------------------------------------------------------------------- /preprocessed_data/LibriTTS/val.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/preprocessed_data/LibriTTS/val.txt -------------------------------------------------------------------------------- /preprocessor/aishell3.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/preprocessor/aishell3.py -------------------------------------------------------------------------------- /preprocessor/libritts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/preprocessor/libritts.py -------------------------------------------------------------------------------- /preprocessor/ljspeech.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/preprocessor/ljspeech.py -------------------------------------------------------------------------------- /preprocessor/preprocessor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/preprocessor/preprocessor.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/requirements.txt -------------------------------------------------------------------------------- /synthesize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/synthesize.py -------------------------------------------------------------------------------- /text/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/text/__init__.py -------------------------------------------------------------------------------- /text/cleaners.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/text/cleaners.py -------------------------------------------------------------------------------- /text/cmudict.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/text/cmudict.py -------------------------------------------------------------------------------- /text/numbers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/text/numbers.py -------------------------------------------------------------------------------- /text/pinyin.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/text/pinyin.py -------------------------------------------------------------------------------- /text/symbols.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/text/symbols.py -------------------------------------------------------------------------------- /train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/train.py -------------------------------------------------------------------------------- /utils/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/utils/model.py -------------------------------------------------------------------------------- /utils/tools.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/keonlee9420/StyleSpeech/HEAD/utils/tools.py --------------------------------------------------------------------------------