├── .gitignore ├── LICENSE ├── README.md ├── config ├── default_c16.yaml └── default_c32.yaml ├── datasets ├── dataloader.py └── metadata │ ├── libritts_train_clean_360_audiopath_text_sid_train.txt │ └── libritts_train_clean_360_audiopath_text_sid_val.txt ├── docs ├── index.html ├── loss.png ├── model_architecture.png └── samples │ ├── seen │ ├── c16 │ │ ├── 2004_147967_000029_000002.wav │ │ ├── 337_126286_000008_000000.wav │ │ ├── 3537_5704_000008_000005.wav │ │ ├── 5319_84357_000005_000004.wav │ │ ├── 6294_86679_000035_000004.wav │ │ └── 949_134657_000002_000005.wav │ ├── c32 │ │ ├── 2004_147967_000029_000002.wav │ │ ├── 337_126286_000008_000000.wav │ │ ├── 3537_5704_000008_000005.wav │ │ ├── 5319_84357_000005_000004.wav │ │ ├── 6294_86679_000035_000004.wav │ │ └── 949_134657_000002_000005.wav │ ├── ground_truth │ │ ├── 2004_147967_000029_000002.wav │ │ ├── 337_126286_000008_000000.wav │ │ ├── 3537_5704_000008_000005.wav │ │ ├── 5319_84357_000005_000004.wav │ │ ├── 6294_86679_000035_000004.wav │ │ └── 949_134657_000002_000005.wav │ ├── official_c16 │ │ ├── 2004_147967_000029_000002.wav │ │ ├── 337_126286_000008_000000.wav │ │ ├── 3537_5704_000008_000005.wav │ │ ├── 5319_84357_000005_000004.wav │ │ └── 6294_86679_000035_000004.wav │ └── official_c32 │ │ ├── 2004_147967_000029_000002.wav │ │ ├── 337_126286_000008_000000.wav │ │ ├── 3537_5704_000008_000005.wav │ │ ├── 5319_84357_000005_000004.wav │ │ └── 6294_86679_000035_000004.wav │ └── unseen │ ├── c16 │ ├── 1089_134686_000007_000005.wav │ ├── 3575_170457_000037_000002.wav │ ├── 4507_16021_000029_000005.wav │ ├── 7021_85628_000037_000000.wav │ ├── 7176_92135_000006_000005.wav │ └── 8224_274384_000016_000000.wav │ ├── c32 │ ├── 1089_134686_000007_000005.wav │ ├── 3575_170457_000037_000002.wav │ ├── 4507_16021_000029_000005.wav │ ├── 7021_85628_000037_000000.wav │ ├── 7176_92135_000006_000005.wav │ └── 8224_274384_000016_000000.wav │ ├── ground_truth │ ├── 1089_134686_000007_000005.wav │ ├── 3575_170457_000037_000002.wav │ ├── 4507_16021_000029_000005.wav │ ├── 7021_85628_000037_000000.wav │ ├── 7176_92135_000006_000005.wav │ └── 8224_274384_000016_000000.wav │ ├── official_c16 │ ├── 1089_134686_000007_000005.wav │ ├── 3575_170457_000037_000002.wav │ ├── 7021_85628_000037_000000.wav │ ├── 7176_92135_000006_000005.wav │ └── 8224_274384_000016_000000.wav │ └── official_c32 │ ├── 1089_134686_000007_000005.wav │ ├── 3575_170457_000037_000002.wav │ ├── 7021_85628_000037_000000.wav │ ├── 7176_92135_000006_000005.wav │ └── 8224_274384_000016_000000.wav ├── inference.py ├── model ├── discriminator.py ├── generator.py ├── lvcnet.py ├── mpd.py └── mrd.py ├── requirements.txt ├── trainer.py └── utils ├── plotting.py ├── stft.py ├── stft_loss.py ├── train.py ├── utils.py ├── validation.py └── writer.py /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/.gitignore -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/README.md -------------------------------------------------------------------------------- /config/default_c16.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/config/default_c16.yaml -------------------------------------------------------------------------------- /config/default_c32.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/config/default_c32.yaml -------------------------------------------------------------------------------- /datasets/dataloader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/datasets/dataloader.py -------------------------------------------------------------------------------- /datasets/metadata/libritts_train_clean_360_audiopath_text_sid_train.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/datasets/metadata/libritts_train_clean_360_audiopath_text_sid_train.txt -------------------------------------------------------------------------------- /datasets/metadata/libritts_train_clean_360_audiopath_text_sid_val.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/datasets/metadata/libritts_train_clean_360_audiopath_text_sid_val.txt -------------------------------------------------------------------------------- /docs/index.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/index.html -------------------------------------------------------------------------------- /docs/loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/loss.png -------------------------------------------------------------------------------- /docs/model_architecture.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/model_architecture.png -------------------------------------------------------------------------------- /docs/samples/seen/c16/2004_147967_000029_000002.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/c16/2004_147967_000029_000002.wav -------------------------------------------------------------------------------- /docs/samples/seen/c16/337_126286_000008_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/c16/337_126286_000008_000000.wav -------------------------------------------------------------------------------- /docs/samples/seen/c16/3537_5704_000008_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/c16/3537_5704_000008_000005.wav -------------------------------------------------------------------------------- /docs/samples/seen/c16/5319_84357_000005_000004.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/c16/5319_84357_000005_000004.wav -------------------------------------------------------------------------------- /docs/samples/seen/c16/6294_86679_000035_000004.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/c16/6294_86679_000035_000004.wav -------------------------------------------------------------------------------- /docs/samples/seen/c16/949_134657_000002_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/c16/949_134657_000002_000005.wav -------------------------------------------------------------------------------- /docs/samples/seen/c32/2004_147967_000029_000002.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/c32/2004_147967_000029_000002.wav -------------------------------------------------------------------------------- /docs/samples/seen/c32/337_126286_000008_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/c32/337_126286_000008_000000.wav -------------------------------------------------------------------------------- /docs/samples/seen/c32/3537_5704_000008_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/c32/3537_5704_000008_000005.wav -------------------------------------------------------------------------------- /docs/samples/seen/c32/5319_84357_000005_000004.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/c32/5319_84357_000005_000004.wav -------------------------------------------------------------------------------- /docs/samples/seen/c32/6294_86679_000035_000004.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/c32/6294_86679_000035_000004.wav -------------------------------------------------------------------------------- /docs/samples/seen/c32/949_134657_000002_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/c32/949_134657_000002_000005.wav -------------------------------------------------------------------------------- /docs/samples/seen/ground_truth/2004_147967_000029_000002.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/ground_truth/2004_147967_000029_000002.wav -------------------------------------------------------------------------------- /docs/samples/seen/ground_truth/337_126286_000008_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/ground_truth/337_126286_000008_000000.wav -------------------------------------------------------------------------------- /docs/samples/seen/ground_truth/3537_5704_000008_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/ground_truth/3537_5704_000008_000005.wav -------------------------------------------------------------------------------- /docs/samples/seen/ground_truth/5319_84357_000005_000004.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/ground_truth/5319_84357_000005_000004.wav -------------------------------------------------------------------------------- /docs/samples/seen/ground_truth/6294_86679_000035_000004.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/ground_truth/6294_86679_000035_000004.wav -------------------------------------------------------------------------------- /docs/samples/seen/ground_truth/949_134657_000002_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/ground_truth/949_134657_000002_000005.wav -------------------------------------------------------------------------------- /docs/samples/seen/official_c16/2004_147967_000029_000002.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/official_c16/2004_147967_000029_000002.wav -------------------------------------------------------------------------------- /docs/samples/seen/official_c16/337_126286_000008_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/official_c16/337_126286_000008_000000.wav -------------------------------------------------------------------------------- /docs/samples/seen/official_c16/3537_5704_000008_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/official_c16/3537_5704_000008_000005.wav -------------------------------------------------------------------------------- /docs/samples/seen/official_c16/5319_84357_000005_000004.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/official_c16/5319_84357_000005_000004.wav -------------------------------------------------------------------------------- /docs/samples/seen/official_c16/6294_86679_000035_000004.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/official_c16/6294_86679_000035_000004.wav -------------------------------------------------------------------------------- /docs/samples/seen/official_c32/2004_147967_000029_000002.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/official_c32/2004_147967_000029_000002.wav -------------------------------------------------------------------------------- /docs/samples/seen/official_c32/337_126286_000008_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/official_c32/337_126286_000008_000000.wav -------------------------------------------------------------------------------- /docs/samples/seen/official_c32/3537_5704_000008_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/official_c32/3537_5704_000008_000005.wav -------------------------------------------------------------------------------- /docs/samples/seen/official_c32/5319_84357_000005_000004.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/official_c32/5319_84357_000005_000004.wav -------------------------------------------------------------------------------- /docs/samples/seen/official_c32/6294_86679_000035_000004.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/seen/official_c32/6294_86679_000035_000004.wav -------------------------------------------------------------------------------- /docs/samples/unseen/c16/1089_134686_000007_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/c16/1089_134686_000007_000005.wav -------------------------------------------------------------------------------- /docs/samples/unseen/c16/3575_170457_000037_000002.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/c16/3575_170457_000037_000002.wav -------------------------------------------------------------------------------- /docs/samples/unseen/c16/4507_16021_000029_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/c16/4507_16021_000029_000005.wav -------------------------------------------------------------------------------- /docs/samples/unseen/c16/7021_85628_000037_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/c16/7021_85628_000037_000000.wav -------------------------------------------------------------------------------- /docs/samples/unseen/c16/7176_92135_000006_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/c16/7176_92135_000006_000005.wav -------------------------------------------------------------------------------- /docs/samples/unseen/c16/8224_274384_000016_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/c16/8224_274384_000016_000000.wav -------------------------------------------------------------------------------- /docs/samples/unseen/c32/1089_134686_000007_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/c32/1089_134686_000007_000005.wav -------------------------------------------------------------------------------- /docs/samples/unseen/c32/3575_170457_000037_000002.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/c32/3575_170457_000037_000002.wav -------------------------------------------------------------------------------- /docs/samples/unseen/c32/4507_16021_000029_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/c32/4507_16021_000029_000005.wav -------------------------------------------------------------------------------- /docs/samples/unseen/c32/7021_85628_000037_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/c32/7021_85628_000037_000000.wav -------------------------------------------------------------------------------- /docs/samples/unseen/c32/7176_92135_000006_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/c32/7176_92135_000006_000005.wav -------------------------------------------------------------------------------- /docs/samples/unseen/c32/8224_274384_000016_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/c32/8224_274384_000016_000000.wav -------------------------------------------------------------------------------- /docs/samples/unseen/ground_truth/1089_134686_000007_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/ground_truth/1089_134686_000007_000005.wav -------------------------------------------------------------------------------- /docs/samples/unseen/ground_truth/3575_170457_000037_000002.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/ground_truth/3575_170457_000037_000002.wav -------------------------------------------------------------------------------- /docs/samples/unseen/ground_truth/4507_16021_000029_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/ground_truth/4507_16021_000029_000005.wav -------------------------------------------------------------------------------- /docs/samples/unseen/ground_truth/7021_85628_000037_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/ground_truth/7021_85628_000037_000000.wav -------------------------------------------------------------------------------- /docs/samples/unseen/ground_truth/7176_92135_000006_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/ground_truth/7176_92135_000006_000005.wav -------------------------------------------------------------------------------- /docs/samples/unseen/ground_truth/8224_274384_000016_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/ground_truth/8224_274384_000016_000000.wav -------------------------------------------------------------------------------- /docs/samples/unseen/official_c16/1089_134686_000007_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/official_c16/1089_134686_000007_000005.wav -------------------------------------------------------------------------------- /docs/samples/unseen/official_c16/3575_170457_000037_000002.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/official_c16/3575_170457_000037_000002.wav -------------------------------------------------------------------------------- /docs/samples/unseen/official_c16/7021_85628_000037_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/official_c16/7021_85628_000037_000000.wav -------------------------------------------------------------------------------- /docs/samples/unseen/official_c16/7176_92135_000006_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/official_c16/7176_92135_000006_000005.wav -------------------------------------------------------------------------------- /docs/samples/unseen/official_c16/8224_274384_000016_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/official_c16/8224_274384_000016_000000.wav -------------------------------------------------------------------------------- /docs/samples/unseen/official_c32/1089_134686_000007_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/official_c32/1089_134686_000007_000005.wav -------------------------------------------------------------------------------- /docs/samples/unseen/official_c32/3575_170457_000037_000002.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/official_c32/3575_170457_000037_000002.wav -------------------------------------------------------------------------------- /docs/samples/unseen/official_c32/7021_85628_000037_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/official_c32/7021_85628_000037_000000.wav -------------------------------------------------------------------------------- /docs/samples/unseen/official_c32/7176_92135_000006_000005.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/official_c32/7176_92135_000006_000005.wav -------------------------------------------------------------------------------- /docs/samples/unseen/official_c32/8224_274384_000016_000000.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/docs/samples/unseen/official_c32/8224_274384_000016_000000.wav -------------------------------------------------------------------------------- /inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/inference.py -------------------------------------------------------------------------------- /model/discriminator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/model/discriminator.py -------------------------------------------------------------------------------- /model/generator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/model/generator.py -------------------------------------------------------------------------------- /model/lvcnet.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/model/lvcnet.py -------------------------------------------------------------------------------- /model/mpd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/model/mpd.py -------------------------------------------------------------------------------- /model/mrd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/model/mrd.py -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/requirements.txt -------------------------------------------------------------------------------- /trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/trainer.py -------------------------------------------------------------------------------- /utils/plotting.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/utils/plotting.py -------------------------------------------------------------------------------- /utils/stft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/utils/stft.py -------------------------------------------------------------------------------- /utils/stft_loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/utils/stft_loss.py -------------------------------------------------------------------------------- /utils/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/utils/train.py -------------------------------------------------------------------------------- /utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/utils/utils.py -------------------------------------------------------------------------------- /utils/validation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/utils/validation.py -------------------------------------------------------------------------------- /utils/writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/maum-ai/univnet/HEAD/utils/writer.py --------------------------------------------------------------------------------