├── .gitattributes ├── .gitignore ├── README.md ├── cmd.sh ├── configs ├── lj_16k_gt_dur.yaml └── lj_16k_gt_dur_reflow.yaml ├── data └── ljspeech │ └── example │ ├── phn_duration │ ├── text │ ├── utt2spk │ ├── utts.list │ └── wav.scp ├── data_collate.py ├── data_loader.py ├── extract_fbank.sh ├── feats └── fbank │ └── ljspeech │ └── train │ └── cmvn.ark ├── generate_for_reflow.py ├── hifigan ├── README.md ├── cmd.sh ├── generation.sh ├── parallel_wavegan │ ├── __init__.py │ ├── bin │ │ ├── __init__.py │ │ ├── compute_statistics.py │ │ ├── decode.py │ │ ├── normalize.py │ │ ├── preprocess.py │ │ └── train.py │ ├── datasets │ │ ├── __init__.py │ │ ├── audio_mel_dataset.py │ │ └── scp_dataset.py │ ├── distributed │ │ ├── __init__.py │ │ └── launch.py │ ├── hh │ ├── layers │ │ ├── __init__.py │ │ ├── causal_conv.py │ │ ├── pqmf.py │ │ ├── residual_block.py │ │ ├── residual_stack.py │ │ ├── tade_res_block.py │ │ ├── tf_layers.py │ │ └── upsample.py │ ├── losses │ │ ├── __init__.py │ │ ├── adversarial_loss.py │ │ ├── feat_match_loss.py │ │ ├── mel_loss.py │ │ └── stft_loss.py │ ├── models │ │ ├── __init__.py │ │ ├── hifigan.py │ │ ├── melgan.py │ │ ├── parallel_wavegan.py │ │ ├── style_melgan.py │ │ └── tf_models.py │ ├── optimizers │ │ ├── __init__.py │ │ └── radam.py │ └── utils │ │ ├── __init__.py │ │ └── utils.py └── utils ├── inference_dataset.py ├── model ├── __init__.py ├── base.py ├── cfm.py ├── diffsinger.py ├── diffusion.py ├── monotonic_align │ ├── LICENCE │ ├── __init__.py │ ├── core.c │ ├── core.pyx │ └── setup.py ├── optimal_transport.py ├── text_encoder.py ├── tts.py └── utils.py ├── path.sh ├── requirements.txt ├── resources └── traj.png ├── tools.py ├── torchdyn ├── __init__.py ├── core │ ├── __init__.py │ ├── defunc.py │ ├── neuralde.py │ ├── problems.py │ └── utils.py ├── datasets │ ├── __init__.py │ └── static_datasets.py ├── models │ ├── README.md │ ├── __init__.py │ ├── cnf.py │ ├── energy.py │ └── hybrid.py ├── nn │ ├── __init__.py │ ├── 
galerkin.py │ └── node_layers.py ├── numerics │ ├── __init__.py │ ├── interpolators.py │ ├── odeint.py │ ├── sensitivity.py │ ├── solvers │ │ ├── _constants.py │ │ ├── hyper.py │ │ ├── ode.py │ │ ├── root.py │ │ ├── sde.py │ │ └── templates.py │ ├── systems.py │ └── utils.py └── utils.py ├── train.py └── utils ├── apply-cmvn.py ├── compute-cmvn-stats.py ├── compute-fbank-feats.py ├── copy-feats.py ├── custom_librosa ├── __init__.py ├── _cache.py ├── beat.py ├── core │ ├── __init__.py │ ├── audio.py │ ├── constantq.py │ ├── convert.py │ ├── fft.py │ ├── harmonic.py │ ├── notation.py │ ├── pitch.py │ └── spectrum.py ├── decompose.py ├── display.py ├── effects.py ├── feature │ ├── __init__.py │ ├── inverse.py │ ├── rhythm.py │ ├── spectral.py │ └── utils.py ├── filters.py ├── onset.py ├── segment.py ├── sequence.py ├── util │ ├── __init__.py │ ├── _nnls.py │ ├── decorators.py │ ├── deprecation.py │ ├── example_data │ │ ├── index.json │ │ └── registry.txt │ ├── exceptions.py │ ├── files.py │ ├── matching.py │ └── utils.py └── version.py ├── espnet_transform ├── add_deltas.py ├── channel_selector.py ├── cmvn.py ├── functional.py ├── perturb.py ├── spec_augment.py ├── spectrogram.py ├── transform_interface.py ├── transformation.py └── wpe.py ├── espnet_utils ├── cli_readers.py ├── cli_utils.py ├── cli_writers.py ├── dynamic_import.py └── io_utils.py ├── feat-to-len.py ├── feat-to-shape.py ├── filter_scp.pl ├── fix_data_dir.sh ├── make_fbank.sh ├── make_utt2spk_id.py ├── parse_options.sh ├── paste-feats.py ├── run.pl ├── spk2utt_to_utt2spk.pl ├── split_scp.pl ├── subset_data_dir.sh ├── subset_scp.pl ├── utt2spk_to_spk2utt.pl └── validate_data_dir.sh /.gitattributes: -------------------------------------------------------------------------------- 1 | # Auto detect text files and perform LF normalization 2 | * text=auto 3 | -------------------------------------------------------------------------------- /.gitignore: 
-------------------------------------------------------------------------------- 1 | # Byte-compiled / optimized / DLL files 2 | __pycache__/ 3 | *.py[cod] 4 | *$py.class 5 | 6 | # C extensions 7 | *.so 8 | 9 | # Distribution / packaging 10 | .Python 11 | build/ 12 | develop-eggs/ 13 | dist/ 14 | downloads/ 15 | eggs/ 16 | .eggs/ 17 | lib/ 18 | lib64/ 19 | parts/ 20 | sdist/ 21 | var/ 22 | wheels/ 23 | share/python-wheels/ 24 | *.egg-info/ 25 | .installed.cfg 26 | *.egg 27 | MANIFEST 28 | 29 | # PyInstaller 30 | # Usually these files are written by a python script from a template 31 | # before PyInstaller builds the exe, so as to inject date/other infos into it. 32 | *.manifest 33 | *.spec 34 | 35 | # Installer logs 36 | pip-log.txt 37 | pip-delete-this-directory.txt 38 | 39 | # Unit test / coverage reports 40 | htmlcov/ 41 | .tox/ 42 | .nox/ 43 | .coverage 44 | .coverage.* 45 | .cache 46 | nosetests.xml 47 | coverage.xml 48 | *.cover 49 | *.py,cover 50 | .hypothesis/ 51 | .pytest_cache/ 52 | cover/ 53 | 54 | # Translations 55 | *.mo 56 | *.pot 57 | 58 | # Django stuff: 59 | *.log 60 | local_settings.py 61 | db.sqlite3 62 | db.sqlite3-journal 63 | 64 | # Flask stuff: 65 | instance/ 66 | .webassets-cache 67 | 68 | # Scrapy stuff: 69 | .scrapy 70 | 71 | # Sphinx documentation 72 | docs/_build/ 73 | 74 | # PyBuilder 75 | .pybuilder/ 76 | target/ 77 | 78 | # Jupyter Notebook 79 | .ipynb_checkpoints 80 | 81 | # IPython 82 | profile_default/ 83 | ipython_config.py 84 | 85 | # pyenv 86 | # For a library or package, you might want to ignore these files since the code is 87 | # intended to run in multiple environments; otherwise, check them in: 88 | # .python-version 89 | 90 | # pipenv 91 | # According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control. 
92 | # However, in case of collaboration, if having platform-specific dependencies or dependencies 93 | # having no cross-platform support, pipenv may install dependencies that don't work, or not 94 | # install all needed dependencies. 95 | #Pipfile.lock 96 | 97 | # poetry 98 | # Similar to Pipfile.lock, it is generally recommended to include poetry.lock in version control. 99 | # This is especially recommended for binary packages to ensure reproducibility, and is more 100 | # commonly ignored for libraries. 101 | # https://python-poetry.org/docs/basic-usage/#commit-your-poetrylock-file-to-version-control 102 | #poetry.lock 103 | 104 | # PEP 582; used by e.g. github.com/David-OConnor/pyflow 105 | __pypackages__/ 106 | 107 | # Celery stuff 108 | celerybeat-schedule 109 | celerybeat.pid 110 | 111 | # SageMath parsed files 112 | *.sage.py 113 | 114 | # Environments 115 | .env 116 | .venv 117 | env/ 118 | venv/ 119 | ENV/ 120 | env.bak/ 121 | venv.bak/ 122 | 123 | # Spyder project settings 124 | .spyderproject 125 | .spyproject 126 | 127 | # Rope project settings 128 | .ropeproject 129 | 130 | # mkdocs documentation 131 | /site 132 | 133 | # mypy 134 | .mypy_cache/ 135 | .dmypy.json 136 | dmypy.json 137 | 138 | # Pyre type checker 139 | .pyre/ 140 | 141 | # pytype static type analyzer 142 | .pytype/ 143 | 144 | # Cython debug symbols 145 | cython_debug/ 146 | 147 | # PyCharm 148 | # JetBrains specific template is maintained in a separate JetBrains.gitignore that can 149 | # be found at https://github.com/github/gitignore/blob/main/Global/JetBrains.gitignore 150 | # and can be added to the global gitignore or merged into this file. For a more nuclear 151 | # option (not recommended) you can uncomment the following to ignore the entire idea folder. 
152 | .idea/ 153 | synthetic_wav/ 154 | exp/ 155 | **/*.wav 156 | .DS_Store -------------------------------------------------------------------------------- /cmd.sh: -------------------------------------------------------------------------------- 1 | # ====== About run.pl, queue.pl, slurm.pl, and ssh.pl ====== 2 | # Usage: <cmd>.pl [options] JOB=1:<nj> <log> <command...> 3 | # e.g. 4 | # run.pl --mem 4G JOB=1:10 echo.JOB.log echo JOB 5 | # 6 | # Options: 7 | # --time