├── .flake8 ├── .gitignore ├── LICENSE ├── README.md ├── __init__.py ├── constants.py ├── data ├── collation.py ├── data_module.py ├── sampler.py ├── semantic_dataset.py └── single_speaker_dataset.py ├── datasets └── example │ └── train.json ├── demo ├── audios-speech-tokenizer │ ├── acoustic │ │ ├── POD0000004393_S0000029.npy │ │ ├── POD0000007005_S0000568.npy │ │ ├── POD0000009720_S0000244.npy │ │ ├── POD0000014360_S0000082.npy │ │ ├── POD0000015908_S0000037.npy │ │ ├── POD1000000022_S0000028.npy │ │ └── male_voice.npy │ └── semantic │ │ ├── POD0000004393_S0000029.npy │ │ ├── POD0000007005_S0000568.npy │ │ ├── POD0000009720_S0000244.npy │ │ ├── POD0000014360_S0000082.npy │ │ ├── POD0000015908_S0000037.npy │ │ ├── POD1000000022_S0000028.npy │ │ └── male_voice.npy ├── audios │ ├── POD0000004393_S0000029.wav │ ├── POD0000007005_S0000568.wav │ ├── POD0000009720_S0000244.wav │ ├── POD0000014360_S0000082.wav │ ├── POD0000015908_S0000037.wav │ ├── POD1000000022_S0000028.wav │ └── male_voice.wav ├── male_voice.wav └── manifest.json ├── docs ├── _config.yml ├── _layouts │ └── default.html ├── assets │ ├── css │ │ └── style.scss │ └── img │ │ └── polyai-logo.webp ├── index.md └── samples │ ├── empress │ ├── 114.wav │ ├── 148.wav │ ├── 161.wav │ ├── 189.wav │ ├── 217.wav │ ├── 226.wav │ ├── 234.wav │ ├── 242.wav │ ├── 262.wav │ ├── 269.wav │ ├── 29.wav │ └── 46.wav │ ├── gigaspeech │ ├── POD1000000004_S0000246.wav │ ├── POD1000000004_S0000247.wav │ ├── POD1000000018_S0000253.wav │ ├── POD1000000018_S0000254.wav │ ├── POD1000000048_S0000035.wav │ ├── POD1000000048_S0000036.wav │ ├── YOU1000000006_S0000051.wav │ ├── YOU1000000006_S0000052.wav │ ├── YOU1000000044_S0000798.wav │ └── YOU1000000044_S0000799.wav │ ├── pheme-100 │ ├── 019.wav │ ├── 042.wav │ ├── 080.wav │ ├── 188.wav │ └── 209.wav │ ├── pheme-300 │ ├── 019.wav │ ├── 042.wav │ ├── 080.wav │ ├── 188.wav │ └── 209.wav │ ├── pheme-empress-300 │ ├── 001.wav │ ├── 002.wav │ ├── 190.wav │ ├── 227.wav │ ├── 235.wav │ ├── 243.wav │ └── 270.wav │ ├── pheme-no-empress-300 │ ├── 190.wav │ ├── 227.wav │ ├── 235.wav │ ├── 243.wav │ └── 270.wav │ └── pheme-no-spkr-300 │ ├── 019.wav │ ├── 042.wav │ ├── 080.wav │ ├── 188.wav │ └── 209.wav ├── modules ├── __init__.py ├── conformer.py ├── masking_logic.py ├── s2a_model.py ├── speech_tokenizer.py ├── t2s_model.py ├── tokenizer.py └── vocoder.py ├── requirements.txt ├── train_s2a.py ├── train_t2s.py ├── transformer_infer.py └── utils ├── __init__.py ├── data_prep.py ├── get_tokens_speech_tokenizer.py └── symbol_table.py /.flake8: -------------------------------------------------------------------------------- 1 | [flake8] 2 | max-line-length = 88 3 | exclude = .git,__pycache__,build,dist 4 | -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/README.md -------------------------------------------------------------------------------- /__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /constants.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/constants.py -------------------------------------------------------------------------------- /data/collation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/data/collation.py -------------------------------------------------------------------------------- /data/data_module.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/data/data_module.py -------------------------------------------------------------------------------- /data/sampler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/data/sampler.py -------------------------------------------------------------------------------- /data/semantic_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/data/semantic_dataset.py -------------------------------------------------------------------------------- /data/single_speaker_dataset.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/data/single_speaker_dataset.py -------------------------------------------------------------------------------- /datasets/example/train.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/datasets/example/train.json -------------------------------------------------------------------------------- /demo/audios-speech-tokenizer/acoustic/POD0000004393_S0000029.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios-speech-tokenizer/acoustic/POD0000004393_S0000029.npy -------------------------------------------------------------------------------- /demo/audios-speech-tokenizer/acoustic/POD0000007005_S0000568.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios-speech-tokenizer/acoustic/POD0000007005_S0000568.npy -------------------------------------------------------------------------------- /demo/audios-speech-tokenizer/acoustic/POD0000009720_S0000244.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios-speech-tokenizer/acoustic/POD0000009720_S0000244.npy -------------------------------------------------------------------------------- /demo/audios-speech-tokenizer/acoustic/POD0000014360_S0000082.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios-speech-tokenizer/acoustic/POD0000014360_S0000082.npy -------------------------------------------------------------------------------- /demo/audios-speech-tokenizer/acoustic/POD0000015908_S0000037.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios-speech-tokenizer/acoustic/POD0000015908_S0000037.npy -------------------------------------------------------------------------------- /demo/audios-speech-tokenizer/acoustic/POD1000000022_S0000028.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios-speech-tokenizer/acoustic/POD1000000022_S0000028.npy -------------------------------------------------------------------------------- /demo/audios-speech-tokenizer/acoustic/male_voice.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios-speech-tokenizer/acoustic/male_voice.npy -------------------------------------------------------------------------------- /demo/audios-speech-tokenizer/semantic/POD0000004393_S0000029.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios-speech-tokenizer/semantic/POD0000004393_S0000029.npy -------------------------------------------------------------------------------- /demo/audios-speech-tokenizer/semantic/POD0000007005_S0000568.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios-speech-tokenizer/semantic/POD0000007005_S0000568.npy -------------------------------------------------------------------------------- /demo/audios-speech-tokenizer/semantic/POD0000009720_S0000244.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios-speech-tokenizer/semantic/POD0000009720_S0000244.npy -------------------------------------------------------------------------------- /demo/audios-speech-tokenizer/semantic/POD0000014360_S0000082.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios-speech-tokenizer/semantic/POD0000014360_S0000082.npy -------------------------------------------------------------------------------- /demo/audios-speech-tokenizer/semantic/POD0000015908_S0000037.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios-speech-tokenizer/semantic/POD0000015908_S0000037.npy -------------------------------------------------------------------------------- /demo/audios-speech-tokenizer/semantic/POD1000000022_S0000028.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios-speech-tokenizer/semantic/POD1000000022_S0000028.npy -------------------------------------------------------------------------------- /demo/audios-speech-tokenizer/semantic/male_voice.npy: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios-speech-tokenizer/semantic/male_voice.npy -------------------------------------------------------------------------------- /demo/audios/POD0000004393_S0000029.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios/POD0000004393_S0000029.wav -------------------------------------------------------------------------------- /demo/audios/POD0000007005_S0000568.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios/POD0000007005_S0000568.wav -------------------------------------------------------------------------------- /demo/audios/POD0000009720_S0000244.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios/POD0000009720_S0000244.wav -------------------------------------------------------------------------------- /demo/audios/POD0000014360_S0000082.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios/POD0000014360_S0000082.wav -------------------------------------------------------------------------------- /demo/audios/POD0000015908_S0000037.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios/POD0000015908_S0000037.wav -------------------------------------------------------------------------------- /demo/audios/POD1000000022_S0000028.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios/POD1000000022_S0000028.wav -------------------------------------------------------------------------------- /demo/audios/male_voice.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/audios/male_voice.wav -------------------------------------------------------------------------------- /demo/male_voice.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/male_voice.wav -------------------------------------------------------------------------------- /demo/manifest.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/demo/manifest.json -------------------------------------------------------------------------------- /docs/_config.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/_config.yml -------------------------------------------------------------------------------- /docs/_layouts/default.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/_layouts/default.html -------------------------------------------------------------------------------- /docs/assets/css/style.scss: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/assets/css/style.scss -------------------------------------------------------------------------------- /docs/assets/img/polyai-logo.webp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/assets/img/polyai-logo.webp -------------------------------------------------------------------------------- /docs/index.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/index.md -------------------------------------------------------------------------------- /docs/samples/empress/114.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/empress/114.wav -------------------------------------------------------------------------------- /docs/samples/empress/148.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/empress/148.wav -------------------------------------------------------------------------------- /docs/samples/empress/161.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/empress/161.wav -------------------------------------------------------------------------------- /docs/samples/empress/189.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/empress/189.wav -------------------------------------------------------------------------------- /docs/samples/empress/217.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/empress/217.wav -------------------------------------------------------------------------------- /docs/samples/empress/226.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/empress/226.wav -------------------------------------------------------------------------------- /docs/samples/empress/234.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/empress/234.wav -------------------------------------------------------------------------------- /docs/samples/empress/242.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/empress/242.wav -------------------------------------------------------------------------------- /docs/samples/empress/262.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/empress/262.wav -------------------------------------------------------------------------------- /docs/samples/empress/269.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/empress/269.wav -------------------------------------------------------------------------------- /docs/samples/empress/29.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/empress/29.wav -------------------------------------------------------------------------------- /docs/samples/empress/46.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/empress/46.wav -------------------------------------------------------------------------------- /docs/samples/gigaspeech/POD1000000004_S0000246.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/gigaspeech/POD1000000004_S0000246.wav -------------------------------------------------------------------------------- /docs/samples/gigaspeech/POD1000000004_S0000247.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/gigaspeech/POD1000000004_S0000247.wav -------------------------------------------------------------------------------- /docs/samples/gigaspeech/POD1000000018_S0000253.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/gigaspeech/POD1000000018_S0000253.wav -------------------------------------------------------------------------------- /docs/samples/gigaspeech/POD1000000018_S0000254.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/gigaspeech/POD1000000018_S0000254.wav -------------------------------------------------------------------------------- /docs/samples/gigaspeech/POD1000000048_S0000035.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/gigaspeech/POD1000000048_S0000035.wav -------------------------------------------------------------------------------- /docs/samples/gigaspeech/POD1000000048_S0000036.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/gigaspeech/POD1000000048_S0000036.wav -------------------------------------------------------------------------------- /docs/samples/gigaspeech/YOU1000000006_S0000051.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/gigaspeech/YOU1000000006_S0000051.wav -------------------------------------------------------------------------------- /docs/samples/gigaspeech/YOU1000000006_S0000052.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/gigaspeech/YOU1000000006_S0000052.wav -------------------------------------------------------------------------------- /docs/samples/gigaspeech/YOU1000000044_S0000798.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/gigaspeech/YOU1000000044_S0000798.wav -------------------------------------------------------------------------------- /docs/samples/gigaspeech/YOU1000000044_S0000799.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/gigaspeech/YOU1000000044_S0000799.wav -------------------------------------------------------------------------------- /docs/samples/pheme-100/019.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-100/019.wav -------------------------------------------------------------------------------- /docs/samples/pheme-100/042.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-100/042.wav -------------------------------------------------------------------------------- /docs/samples/pheme-100/080.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-100/080.wav -------------------------------------------------------------------------------- /docs/samples/pheme-100/188.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-100/188.wav -------------------------------------------------------------------------------- /docs/samples/pheme-100/209.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-100/209.wav -------------------------------------------------------------------------------- /docs/samples/pheme-300/019.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-300/019.wav -------------------------------------------------------------------------------- /docs/samples/pheme-300/042.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-300/042.wav -------------------------------------------------------------------------------- /docs/samples/pheme-300/080.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-300/080.wav -------------------------------------------------------------------------------- /docs/samples/pheme-300/188.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-300/188.wav -------------------------------------------------------------------------------- /docs/samples/pheme-300/209.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-300/209.wav -------------------------------------------------------------------------------- /docs/samples/pheme-empress-300/001.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-empress-300/001.wav -------------------------------------------------------------------------------- /docs/samples/pheme-empress-300/002.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-empress-300/002.wav -------------------------------------------------------------------------------- /docs/samples/pheme-empress-300/190.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-empress-300/190.wav -------------------------------------------------------------------------------- /docs/samples/pheme-empress-300/227.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-empress-300/227.wav -------------------------------------------------------------------------------- /docs/samples/pheme-empress-300/235.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-empress-300/235.wav -------------------------------------------------------------------------------- /docs/samples/pheme-empress-300/243.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-empress-300/243.wav -------------------------------------------------------------------------------- /docs/samples/pheme-empress-300/270.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-empress-300/270.wav -------------------------------------------------------------------------------- /docs/samples/pheme-no-empress-300/190.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-no-empress-300/190.wav -------------------------------------------------------------------------------- /docs/samples/pheme-no-empress-300/227.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-no-empress-300/227.wav -------------------------------------------------------------------------------- /docs/samples/pheme-no-empress-300/235.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-no-empress-300/235.wav -------------------------------------------------------------------------------- /docs/samples/pheme-no-empress-300/243.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-no-empress-300/243.wav -------------------------------------------------------------------------------- /docs/samples/pheme-no-empress-300/270.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-no-empress-300/270.wav -------------------------------------------------------------------------------- /docs/samples/pheme-no-spkr-300/019.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-no-spkr-300/019.wav -------------------------------------------------------------------------------- /docs/samples/pheme-no-spkr-300/042.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-no-spkr-300/042.wav -------------------------------------------------------------------------------- /docs/samples/pheme-no-spkr-300/080.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-no-spkr-300/080.wav -------------------------------------------------------------------------------- /docs/samples/pheme-no-spkr-300/188.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-no-spkr-300/188.wav -------------------------------------------------------------------------------- /docs/samples/pheme-no-spkr-300/209.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/docs/samples/pheme-no-spkr-300/209.wav -------------------------------------------------------------------------------- /modules/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /modules/conformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/modules/conformer.py -------------------------------------------------------------------------------- /modules/masking_logic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/modules/masking_logic.py -------------------------------------------------------------------------------- /modules/s2a_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/modules/s2a_model.py -------------------------------------------------------------------------------- /modules/speech_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/modules/speech_tokenizer.py -------------------------------------------------------------------------------- /modules/t2s_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/modules/t2s_model.py -------------------------------------------------------------------------------- /modules/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/modules/tokenizer.py -------------------------------------------------------------------------------- /modules/vocoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/modules/vocoder.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/requirements.txt -------------------------------------------------------------------------------- /train_s2a.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/train_s2a.py -------------------------------------------------------------------------------- /train_t2s.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/train_t2s.py -------------------------------------------------------------------------------- /transformer_infer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/transformer_infer.py -------------------------------------------------------------------------------- /utils/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/utils/__init__.py -------------------------------------------------------------------------------- /utils/data_prep.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/utils/data_prep.py -------------------------------------------------------------------------------- /utils/get_tokens_speech_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/utils/get_tokens_speech_tokenizer.py -------------------------------------------------------------------------------- /utils/symbol_table.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/PolyAI-LDN/pheme/HEAD/utils/symbol_table.py --------------------------------------------------------------------------------