├── .DS_Store ├── Demo_json_files ├── Demo_npy_energy.json ├── Demo_textgrid.json └── Demo_wav.json ├── DiffAR200_C=128 ├── GPU_utilization.pdf └── dd.txt ├── Examples ├── .DS_Store ├── Ablation_study │ ├── DiffAR+P_LJ003-0228_0.wav │ ├── DiffAR+P_LJ034-0183_0.wav │ ├── DiffAR+P_LJ038-0257_0.wav │ ├── DiffAR+P_LJ050-0116_0.wav │ ├── DiffAR-E_LJ003-0228_0.wav │ ├── DiffAR-E_LJ034-0183_0.wav │ ├── DiffAR-E_LJ038-0257_0.wav │ ├── DiffAR-E_LJ050-0116_0.wav │ ├── DiffAR_1000_LJ003-0228_0.wav │ ├── DiffAR_1000_LJ034-0183_0.wav │ ├── DiffAR_1000_LJ038-0257_0.wav │ ├── DiffAR_1000_LJ050-0116_0.wav │ ├── DiffAR_200_LJ003-0228_0.wav │ ├── DiffAR_200_LJ034-0183_0.wav │ ├── DiffAR_200_LJ038-0257_0.wav │ ├── DiffAR_200_LJ050-0116_0.wav │ ├── LJ003-0228.wav │ ├── LJ034-0183.wav │ ├── LJ038-0257.wav │ └── LJ050-0116.wav ├── Architecture_figures │ ├── DiffAR_lr_and_dim.pdf │ └── tt.txt ├── Conditional_generation │ ├── DiffAR_1000_predicted_LJ019-0361_0wav.wav │ ├── DiffAR_1000_predicted_LJ038-0126_0.wav │ ├── DiffAR_1000_predicted_LJ038-0242_0.wav │ ├── DiffAR_1000_predicted_LJ043-0004_0.wav │ ├── DiffAR_200_predicted_LJ019-0361_0.wav │ ├── DiffAR_200_predicted_LJ019-0361_1.wav │ ├── DiffAR_200_predicted_LJ038-0126_0.wav │ ├── DiffAR_200_predicted_LJ038-0242_0.wav │ ├── DiffAR_200_predicted_LJ043-0004_0.wav │ ├── FastSpeech_LJ002-0019_900k_0.wav │ ├── FastSpeech_LJ019-0361_900k_0.wav │ ├── FastSpeech_LJ038-0126_900k_0.wav │ ├── FastSpeech_LJ038-0242_900k_0.wav │ ├── FastSpeech_LJ043-0004_900k_0.wav │ ├── WaveGrad_LJ019-0361_0.wav │ ├── WaveGrad_LJ019-0361_1.wav │ ├── WaveGrad_LJ038-0126_0.wav │ ├── WaveGrad_LJ038-0126_1.wav │ ├── WaveGrad_LJ038-0242_0.wav │ ├── WaveGrad_LJ043-0004_0.wav │ └── ddd.txt ├── Focal_Fry │ ├── .DS_Store │ ├── DiffAR_200_LJ020-0061_Worm.wav │ ├── DiffAR_200_Worm_Waveform.png │ ├── DiffAR_200_Worm_spec.png │ ├── FastSpeech2_LJ020-0061_Worm.wav │ ├── FastSpeech2_Worm_Spec.png │ ├── FastSpeech2_Worm_Waveform.png │ ├── WaveGrad2_LJ020-0061_Worm.wav │ ├── WaveGrad2_Worm_Spec.png │ └── WaveGrad2_Worm_WaveForm.png ├── Full_vocal_fry_sentences │ ├── 128050_0_predicted_LJ020-0061.wav │ ├── 918100_1_seed_1_LJ015-0115.wav │ ├── 918100_1_seed_1_LJ018-0013_good.wav │ ├── 918100_1_seed_1_LJ038-0126.wav │ ├── 918100_4_seed_5_LJ002-0019.wav │ ├── 918100_7_seed_8_LJ050-0116_pg.wav │ ├── 918100_8_seed_9_LJ038-0257_pg.wav │ └── 918100_predicted_LJ050-0022_iter_0_seed_1.wav ├── Multiply_speakers │ ├── CSTR_VCTK_EXAMPLES │ │ ├── DiffAR-VCTK_results │ │ │ ├── 423300_0_p253_108_mic2_.wav │ │ │ ├── 423300_0_p271_065_mic2_.wav │ │ │ ├── 423300_0_p271_150_mic2_.wav │ │ │ ├── 423300_0_p271_153_mic2_.wav │ │ │ ├── 423300_0_p272_312_mic2_.wav │ │ │ ├── 423300_0_p272_317_mic2_.wav │ │ │ ├── 423300_0_p272_336_mic2_.wav │ │ │ ├── 423300_0_p316_025_mic2_.wav │ │ │ ├── 423300_0_p316_357_mic2_.wav │ │ │ ├── 423300_0_p335_163_mic2_.wav │ │ │ ├── 423300_0_p335_169_mic2_.wav │ │ │ ├── 423300_0_p339_298_mic2_.wav │ │ │ ├── 423300_0_p339_300_mic2_.wav │ │ │ ├── 423300_0_p376_003_mic2_.wav │ │ │ └── cc.txt │ │ └── original_wavs │ │ │ ├── p271_150_mic2.wav │ │ │ ├── p271_153_mic2.wav │ │ │ ├── p272_312_mic2.wav │ │ │ ├── p272_317_mic2.wav │ │ │ ├── p272_336_mic2.wav │ │ │ ├── p316_357_mic2.wav │ │ │ ├── p335_163_mic2.wav │ │ │ ├── p335_169_mic2.wav │ │ │ ├── p339_298_mic2.wav │ │ │ ├── p339_300_mic2.wav │ │ │ └── tt.txt │ ├── Multiply_speakers_architecture.pdf │ ├── Several_speakers_architecture.pdf │ └── tt.txt ├── Showing_stochasticity │ ├── .DS_Store │ ├── DiffAR+P_LJ_050_0116_0.wav │ ├── DiffAR+P_LJ_050_0116_1.wav │ ├── DiffAR+P_LJ_050_0116_2.wav │ ├── DiffAR+P_energy.png │ ├── DiffAR+P_pitch.png │ ├── DiffAR-E_LJ050-0116_0.wav │ ├── DiffAR-E_LJ050-0116_1.wav │ ├── DiffAR-E_LJ050-0116_2.wav │ ├── DiffAR-E_energy.png │ ├── DiffAR-E_pitch.png │ ├── DiffAR_200_energy.png │ ├── DiffAR_200_pitch.png │ ├── DiffAR_LJ050-0116_0.wav │ ├── DiffAR_LJ050-0116_1.wav │ └── Screen Shot 2023-10-05 at 16.13.09.png ├── Unconditional_generation │ ├── unconditioanl_gen_1s_500ms_0.wav │ ├── unconditioanl_gen_1s_500ms_1.wav │ ├── unconditioanl_gen_1s_500ms_2.wav │ ├── unconditioanl_gen_1s_500ms_3.wav │ ├── unconditioanl_gen_400ms_200ms_1.wav │ ├── unconditioanl_gen_400ms_200ms_2.wav │ ├── unconditioanl_gen_400ms_200ms_3.wav │ ├── unconditioanl_gen_400ms_200ms_4.wav │ ├── unconditioanl_gen_500ms_250ms_0.wav │ ├── unconditioanl_gen_500ms_250ms_1.wav │ ├── unconditioanl_gen_500ms_250ms_2.wav │ ├── unconditioanl_gen_500ms_250ms_3.wav │ └── unconditioanl_gen_500ms_250ms_4.wav ├── Vocal_Fry │ ├── .DS_Store │ ├── DiffAR_200_LJ020-0061_Worm.wav │ ├── DiffAR_200_Worm_Waveform.png │ ├── DiffAR_200_Worm_spec.png │ ├── FastSpeech2_LJ020-0061_Worm.wav │ ├── FastSpeech2_Worm_Spec.png │ ├── FastSpeech2_Worm_Waveform.png │ ├── WaveGrad2_LJ020-0061_Worm.wav │ ├── WaveGrad2_Worm_Spec.png │ └── WaveGrad2_Worm_WaveForm.png ├── baselines_stochasticity │ ├── DiffGAN_energy.pdf │ ├── DiffGAN_pitch.pdf │ ├── Grad_TTS_energy.pdf │ ├── Grad_TTS_pitch.pdf │ ├── ProDiff_energy.pdf │ ├── ProDiff_pitch.pdf │ ├── VITS_energy.pdf │ ├── VITS_pitch.pdf │ └── tt.txt └── train_loss │ ├── DiffAR200_train_loss.png │ └── dd.txt ├── LICENSE ├── README.md ├── __main__.py ├── audio.py ├── conf └── conf.yaml ├── distrib.py ├── docs ├── .DS_Store ├── frame_explain_2.png ├── index.html ├── styles.css └── ttf_font_files │ ├── Helvetica CE Narrow.woff │ ├── SpaceMono-Regular.ttf │ └── SpaceMono-Regular.woff ├── duration_predictors_files ├── Text_To_Speech_Procedure.py ├── duration_predictor.py ├── duration_predictor.yaml ├── playground_duration.py └── saved_models │ └── predictor_model_sec_dividing_kernel_5.ckpt ├── empty_sec_audio.wav ├── energy_predictor_files ├── Text_To_Speech_Procedure.py ├── energy_predictor.py ├── energy_predictor.yaml ├── energy_predictor_utils.py ├── playground_energy.py └── saved_models │ └── energy_predictor_model_2_layers_7_5_k.ckpt ├── eval.py ├── folder2json.py ├── folder2json_npy.py ├── folder2json_text.py ├── inference.py ├── learner.py ├── model.py ├── params.py └── utils_for_inference.py /.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/.DS_Store -------------------------------------------------------------------------------- /Demo_json_files/Demo_npy_energy.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Demo_json_files/Demo_npy_energy.json -------------------------------------------------------------------------------- /Demo_json_files/Demo_textgrid.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Demo_json_files/Demo_textgrid.json -------------------------------------------------------------------------------- /Demo_json_files/Demo_wav.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Demo_json_files/Demo_wav.json -------------------------------------------------------------------------------- /DiffAR200_C=128/GPU_utilization.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/DiffAR200_C=128/GPU_utilization.pdf -------------------------------------------------------------------------------- /DiffAR200_C=128/dd.txt: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /Examples/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/.DS_Store -------------------------------------------------------------------------------- /Examples/Ablation_study/DiffAR+P_LJ003-0228_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/DiffAR+P_LJ003-0228_0.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/DiffAR+P_LJ034-0183_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/DiffAR+P_LJ034-0183_0.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/DiffAR+P_LJ038-0257_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/DiffAR+P_LJ038-0257_0.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/DiffAR+P_LJ050-0116_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/DiffAR+P_LJ050-0116_0.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/DiffAR-E_LJ003-0228_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/DiffAR-E_LJ003-0228_0.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/DiffAR-E_LJ034-0183_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/DiffAR-E_LJ034-0183_0.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/DiffAR-E_LJ038-0257_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/DiffAR-E_LJ038-0257_0.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/DiffAR-E_LJ050-0116_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/DiffAR-E_LJ050-0116_0.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/DiffAR_1000_LJ003-0228_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/DiffAR_1000_LJ003-0228_0.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/DiffAR_1000_LJ034-0183_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/DiffAR_1000_LJ034-0183_0.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/DiffAR_1000_LJ038-0257_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/DiffAR_1000_LJ038-0257_0.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/DiffAR_1000_LJ050-0116_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/DiffAR_1000_LJ050-0116_0.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/DiffAR_200_LJ003-0228_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/DiffAR_200_LJ003-0228_0.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/DiffAR_200_LJ034-0183_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/DiffAR_200_LJ034-0183_0.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/DiffAR_200_LJ038-0257_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/DiffAR_200_LJ038-0257_0.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/DiffAR_200_LJ050-0116_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/DiffAR_200_LJ050-0116_0.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/LJ003-0228.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/LJ003-0228.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/LJ034-0183.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/LJ034-0183.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/LJ038-0257.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/LJ038-0257.wav -------------------------------------------------------------------------------- /Examples/Ablation_study/LJ050-0116.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Ablation_study/LJ050-0116.wav -------------------------------------------------------------------------------- /Examples/Architecture_figures/DiffAR_lr_and_dim.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Architecture_figures/DiffAR_lr_and_dim.pdf -------------------------------------------------------------------------------- /Examples/Architecture_figures/tt.txt: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /Examples/Conditional_generation/DiffAR_1000_predicted_LJ019-0361_0wav.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/DiffAR_1000_predicted_LJ019-0361_0wav.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/DiffAR_1000_predicted_LJ038-0126_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/DiffAR_1000_predicted_LJ038-0126_0.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/DiffAR_1000_predicted_LJ038-0242_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/DiffAR_1000_predicted_LJ038-0242_0.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/DiffAR_1000_predicted_LJ043-0004_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/DiffAR_1000_predicted_LJ043-0004_0.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/DiffAR_200_predicted_LJ019-0361_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/DiffAR_200_predicted_LJ019-0361_0.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/DiffAR_200_predicted_LJ019-0361_1.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/DiffAR_200_predicted_LJ019-0361_1.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/DiffAR_200_predicted_LJ038-0126_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/DiffAR_200_predicted_LJ038-0126_0.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/DiffAR_200_predicted_LJ038-0242_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/DiffAR_200_predicted_LJ038-0242_0.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/DiffAR_200_predicted_LJ043-0004_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/DiffAR_200_predicted_LJ043-0004_0.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/FastSpeech_LJ002-0019_900k_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/FastSpeech_LJ002-0019_900k_0.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/FastSpeech_LJ019-0361_900k_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/FastSpeech_LJ019-0361_900k_0.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/FastSpeech_LJ038-0126_900k_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/FastSpeech_LJ038-0126_900k_0.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/FastSpeech_LJ038-0242_900k_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/FastSpeech_LJ038-0242_900k_0.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/FastSpeech_LJ043-0004_900k_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/FastSpeech_LJ043-0004_900k_0.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/WaveGrad_LJ019-0361_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/WaveGrad_LJ019-0361_0.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/WaveGrad_LJ019-0361_1.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/WaveGrad_LJ019-0361_1.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/WaveGrad_LJ038-0126_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/WaveGrad_LJ038-0126_0.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/WaveGrad_LJ038-0126_1.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/WaveGrad_LJ038-0126_1.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/WaveGrad_LJ038-0242_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/WaveGrad_LJ038-0242_0.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/WaveGrad_LJ043-0004_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Conditional_generation/WaveGrad_LJ043-0004_0.wav -------------------------------------------------------------------------------- /Examples/Conditional_generation/ddd.txt: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /Examples/Focal_Fry/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Focal_Fry/.DS_Store -------------------------------------------------------------------------------- /Examples/Focal_Fry/DiffAR_200_LJ020-0061_Worm.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Focal_Fry/DiffAR_200_LJ020-0061_Worm.wav -------------------------------------------------------------------------------- /Examples/Focal_Fry/DiffAR_200_Worm_Waveform.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Focal_Fry/DiffAR_200_Worm_Waveform.png -------------------------------------------------------------------------------- /Examples/Focal_Fry/DiffAR_200_Worm_spec.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Focal_Fry/DiffAR_200_Worm_spec.png -------------------------------------------------------------------------------- /Examples/Focal_Fry/FastSpeech2_LJ020-0061_Worm.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Focal_Fry/FastSpeech2_LJ020-0061_Worm.wav -------------------------------------------------------------------------------- /Examples/Focal_Fry/FastSpeech2_Worm_Spec.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Focal_Fry/FastSpeech2_Worm_Spec.png -------------------------------------------------------------------------------- /Examples/Focal_Fry/FastSpeech2_Worm_Waveform.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Focal_Fry/FastSpeech2_Worm_Waveform.png -------------------------------------------------------------------------------- /Examples/Focal_Fry/WaveGrad2_LJ020-0061_Worm.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Focal_Fry/WaveGrad2_LJ020-0061_Worm.wav -------------------------------------------------------------------------------- /Examples/Focal_Fry/WaveGrad2_Worm_Spec.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Focal_Fry/WaveGrad2_Worm_Spec.png -------------------------------------------------------------------------------- /Examples/Focal_Fry/WaveGrad2_Worm_WaveForm.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Focal_Fry/WaveGrad2_Worm_WaveForm.png -------------------------------------------------------------------------------- /Examples/Full_vocal_fry_sentences/128050_0_predicted_LJ020-0061.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Full_vocal_fry_sentences/128050_0_predicted_LJ020-0061.wav -------------------------------------------------------------------------------- /Examples/Full_vocal_fry_sentences/918100_1_seed_1_LJ015-0115.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Full_vocal_fry_sentences/918100_1_seed_1_LJ015-0115.wav -------------------------------------------------------------------------------- /Examples/Full_vocal_fry_sentences/918100_1_seed_1_LJ018-0013_good.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Full_vocal_fry_sentences/918100_1_seed_1_LJ018-0013_good.wav -------------------------------------------------------------------------------- /Examples/Full_vocal_fry_sentences/918100_1_seed_1_LJ038-0126.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Full_vocal_fry_sentences/918100_1_seed_1_LJ038-0126.wav -------------------------------------------------------------------------------- /Examples/Full_vocal_fry_sentences/918100_4_seed_5_LJ002-0019.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Full_vocal_fry_sentences/918100_4_seed_5_LJ002-0019.wav -------------------------------------------------------------------------------- /Examples/Full_vocal_fry_sentences/918100_7_seed_8_LJ050-0116_pg.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Full_vocal_fry_sentences/918100_7_seed_8_LJ050-0116_pg.wav -------------------------------------------------------------------------------- /Examples/Full_vocal_fry_sentences/918100_8_seed_9_LJ038-0257_pg.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Full_vocal_fry_sentences/918100_8_seed_9_LJ038-0257_pg.wav -------------------------------------------------------------------------------- /Examples/Full_vocal_fry_sentences/918100_predicted_LJ050-0022_iter_0_seed_1.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Full_vocal_fry_sentences/918100_predicted_LJ050-0022_iter_0_seed_1.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p253_108_mic2_.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p253_108_mic2_.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p271_065_mic2_.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p271_065_mic2_.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p271_150_mic2_.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p271_150_mic2_.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p271_153_mic2_.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p271_153_mic2_.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p272_312_mic2_.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p272_312_mic2_.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p272_317_mic2_.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p272_317_mic2_.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p272_336_mic2_.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p272_336_mic2_.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p316_025_mic2_.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p316_025_mic2_.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p316_357_mic2_.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p316_357_mic2_.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p335_163_mic2_.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p335_163_mic2_.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p335_169_mic2_.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p335_169_mic2_.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p339_298_mic2_.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p339_298_mic2_.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p339_300_mic2_.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p339_300_mic2_.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p376_003_mic2_.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/423300_0_p376_003_mic2_.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/DiffAR-VCTK_results/cc.txt: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p271_150_mic2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p271_150_mic2.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p271_153_mic2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p271_153_mic2.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p272_312_mic2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p272_312_mic2.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p272_317_mic2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p272_317_mic2.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p272_336_mic2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p272_336_mic2.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p316_357_mic2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p316_357_mic2.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p335_163_mic2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p335_163_mic2.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p335_169_mic2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p335_169_mic2.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p339_298_mic2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p339_298_mic2.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p339_300_mic2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/p339_300_mic2.wav -------------------------------------------------------------------------------- /Examples/Multiply_speakers/CSTR_VCTK_EXAMPLES/original_wavs/tt.txt: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /Examples/Multiply_speakers/Multiply_speakers_architecture.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/Multiply_speakers_architecture.pdf -------------------------------------------------------------------------------- /Examples/Multiply_speakers/Several_speakers_architecture.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Multiply_speakers/Several_speakers_architecture.pdf -------------------------------------------------------------------------------- /Examples/Multiply_speakers/tt.txt: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /Examples/Showing_stochasticity/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Showing_stochasticity/.DS_Store -------------------------------------------------------------------------------- /Examples/Showing_stochasticity/DiffAR+P_LJ_050_0116_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Showing_stochasticity/DiffAR+P_LJ_050_0116_0.wav -------------------------------------------------------------------------------- /Examples/Showing_stochasticity/DiffAR+P_LJ_050_0116_1.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Showing_stochasticity/DiffAR+P_LJ_050_0116_1.wav -------------------------------------------------------------------------------- /Examples/Showing_stochasticity/DiffAR+P_LJ_050_0116_2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Showing_stochasticity/DiffAR+P_LJ_050_0116_2.wav -------------------------------------------------------------------------------- /Examples/Showing_stochasticity/DiffAR+P_energy.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Showing_stochasticity/DiffAR+P_energy.png -------------------------------------------------------------------------------- /Examples/Showing_stochasticity/DiffAR+P_pitch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Showing_stochasticity/DiffAR+P_pitch.png -------------------------------------------------------------------------------- /Examples/Showing_stochasticity/DiffAR-E_LJ050-0116_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Showing_stochasticity/DiffAR-E_LJ050-0116_0.wav -------------------------------------------------------------------------------- /Examples/Showing_stochasticity/DiffAR-E_LJ050-0116_1.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Showing_stochasticity/DiffAR-E_LJ050-0116_1.wav -------------------------------------------------------------------------------- /Examples/Showing_stochasticity/DiffAR-E_LJ050-0116_2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Showing_stochasticity/DiffAR-E_LJ050-0116_2.wav -------------------------------------------------------------------------------- /Examples/Showing_stochasticity/DiffAR-E_energy.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Showing_stochasticity/DiffAR-E_energy.png -------------------------------------------------------------------------------- /Examples/Showing_stochasticity/DiffAR-E_pitch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Showing_stochasticity/DiffAR-E_pitch.png -------------------------------------------------------------------------------- /Examples/Showing_stochasticity/DiffAR_200_energy.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Showing_stochasticity/DiffAR_200_energy.png -------------------------------------------------------------------------------- /Examples/Showing_stochasticity/DiffAR_200_pitch.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Showing_stochasticity/DiffAR_200_pitch.png -------------------------------------------------------------------------------- /Examples/Showing_stochasticity/DiffAR_LJ050-0116_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Showing_stochasticity/DiffAR_LJ050-0116_0.wav -------------------------------------------------------------------------------- /Examples/Showing_stochasticity/DiffAR_LJ050-0116_1.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Showing_stochasticity/DiffAR_LJ050-0116_1.wav -------------------------------------------------------------------------------- /Examples/Showing_stochasticity/Screen Shot 2023-10-05 at 16.13.09.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Showing_stochasticity/Screen Shot 2023-10-05 at 16.13.09.png -------------------------------------------------------------------------------- /Examples/Unconditional_generation/unconditioanl_gen_1s_500ms_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Unconditional_generation/unconditioanl_gen_1s_500ms_0.wav -------------------------------------------------------------------------------- /Examples/Unconditional_generation/unconditioanl_gen_1s_500ms_1.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Unconditional_generation/unconditioanl_gen_1s_500ms_1.wav -------------------------------------------------------------------------------- /Examples/Unconditional_generation/unconditioanl_gen_1s_500ms_2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Unconditional_generation/unconditioanl_gen_1s_500ms_2.wav -------------------------------------------------------------------------------- /Examples/Unconditional_generation/unconditioanl_gen_1s_500ms_3.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Unconditional_generation/unconditioanl_gen_1s_500ms_3.wav -------------------------------------------------------------------------------- /Examples/Unconditional_generation/unconditioanl_gen_400ms_200ms_1.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Unconditional_generation/unconditioanl_gen_400ms_200ms_1.wav -------------------------------------------------------------------------------- /Examples/Unconditional_generation/unconditioanl_gen_400ms_200ms_2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Unconditional_generation/unconditioanl_gen_400ms_200ms_2.wav -------------------------------------------------------------------------------- /Examples/Unconditional_generation/unconditioanl_gen_400ms_200ms_3.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Unconditional_generation/unconditioanl_gen_400ms_200ms_3.wav -------------------------------------------------------------------------------- /Examples/Unconditional_generation/unconditioanl_gen_400ms_200ms_4.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Unconditional_generation/unconditioanl_gen_400ms_200ms_4.wav -------------------------------------------------------------------------------- /Examples/Unconditional_generation/unconditioanl_gen_500ms_250ms_0.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Unconditional_generation/unconditioanl_gen_500ms_250ms_0.wav -------------------------------------------------------------------------------- /Examples/Unconditional_generation/unconditioanl_gen_500ms_250ms_1.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Unconditional_generation/unconditioanl_gen_500ms_250ms_1.wav -------------------------------------------------------------------------------- /Examples/Unconditional_generation/unconditioanl_gen_500ms_250ms_2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Unconditional_generation/unconditioanl_gen_500ms_250ms_2.wav -------------------------------------------------------------------------------- /Examples/Unconditional_generation/unconditioanl_gen_500ms_250ms_3.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Unconditional_generation/unconditioanl_gen_500ms_250ms_3.wav -------------------------------------------------------------------------------- /Examples/Unconditional_generation/unconditioanl_gen_500ms_250ms_4.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Unconditional_generation/unconditioanl_gen_500ms_250ms_4.wav -------------------------------------------------------------------------------- /Examples/Vocal_Fry/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Vocal_Fry/.DS_Store -------------------------------------------------------------------------------- /Examples/Vocal_Fry/DiffAR_200_LJ020-0061_Worm.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Vocal_Fry/DiffAR_200_LJ020-0061_Worm.wav -------------------------------------------------------------------------------- /Examples/Vocal_Fry/DiffAR_200_Worm_Waveform.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Vocal_Fry/DiffAR_200_Worm_Waveform.png -------------------------------------------------------------------------------- /Examples/Vocal_Fry/DiffAR_200_Worm_spec.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Vocal_Fry/DiffAR_200_Worm_spec.png -------------------------------------------------------------------------------- /Examples/Vocal_Fry/FastSpeech2_LJ020-0061_Worm.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Vocal_Fry/FastSpeech2_LJ020-0061_Worm.wav -------------------------------------------------------------------------------- /Examples/Vocal_Fry/FastSpeech2_Worm_Spec.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Vocal_Fry/FastSpeech2_Worm_Spec.png -------------------------------------------------------------------------------- /Examples/Vocal_Fry/FastSpeech2_Worm_Waveform.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Vocal_Fry/FastSpeech2_Worm_Waveform.png -------------------------------------------------------------------------------- /Examples/Vocal_Fry/WaveGrad2_LJ020-0061_Worm.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Vocal_Fry/WaveGrad2_LJ020-0061_Worm.wav -------------------------------------------------------------------------------- /Examples/Vocal_Fry/WaveGrad2_Worm_Spec.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Vocal_Fry/WaveGrad2_Worm_Spec.png -------------------------------------------------------------------------------- /Examples/Vocal_Fry/WaveGrad2_Worm_WaveForm.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/Vocal_Fry/WaveGrad2_Worm_WaveForm.png -------------------------------------------------------------------------------- /Examples/baselines_stochasticity/DiffGAN_energy.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/baselines_stochasticity/DiffGAN_energy.pdf -------------------------------------------------------------------------------- /Examples/baselines_stochasticity/DiffGAN_pitch.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/baselines_stochasticity/DiffGAN_pitch.pdf -------------------------------------------------------------------------------- /Examples/baselines_stochasticity/Grad_TTS_energy.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/baselines_stochasticity/Grad_TTS_energy.pdf -------------------------------------------------------------------------------- /Examples/baselines_stochasticity/Grad_TTS_pitch.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/baselines_stochasticity/Grad_TTS_pitch.pdf -------------------------------------------------------------------------------- /Examples/baselines_stochasticity/ProDiff_energy.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/baselines_stochasticity/ProDiff_energy.pdf -------------------------------------------------------------------------------- /Examples/baselines_stochasticity/ProDiff_pitch.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/baselines_stochasticity/ProDiff_pitch.pdf -------------------------------------------------------------------------------- /Examples/baselines_stochasticity/VITS_energy.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/baselines_stochasticity/VITS_energy.pdf -------------------------------------------------------------------------------- /Examples/baselines_stochasticity/VITS_pitch.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/baselines_stochasticity/VITS_pitch.pdf -------------------------------------------------------------------------------- /Examples/baselines_stochasticity/tt.txt: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /Examples/train_loss/DiffAR200_train_loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/Examples/train_loss/DiffAR200_train_loss.png -------------------------------------------------------------------------------- /Examples/train_loss/dd.txt: -------------------------------------------------------------------------------- 1 | 2 | -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/README.md -------------------------------------------------------------------------------- /__main__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/__main__.py -------------------------------------------------------------------------------- /audio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/audio.py -------------------------------------------------------------------------------- /conf/conf.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/conf/conf.yaml -------------------------------------------------------------------------------- /distrib.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/distrib.py -------------------------------------------------------------------------------- /docs/.DS_Store: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/docs/.DS_Store -------------------------------------------------------------------------------- /docs/frame_explain_2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/docs/frame_explain_2.png -------------------------------------------------------------------------------- /docs/index.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/docs/index.html -------------------------------------------------------------------------------- /docs/styles.css: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/docs/styles.css -------------------------------------------------------------------------------- /docs/ttf_font_files/Helvetica CE Narrow.woff: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/docs/ttf_font_files/Helvetica CE Narrow.woff -------------------------------------------------------------------------------- /docs/ttf_font_files/SpaceMono-Regular.ttf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/docs/ttf_font_files/SpaceMono-Regular.ttf -------------------------------------------------------------------------------- /docs/ttf_font_files/SpaceMono-Regular.woff: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/docs/ttf_font_files/SpaceMono-Regular.woff -------------------------------------------------------------------------------- /duration_predictors_files/Text_To_Speech_Procedure.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/duration_predictors_files/Text_To_Speech_Procedure.py -------------------------------------------------------------------------------- /duration_predictors_files/duration_predictor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/duration_predictors_files/duration_predictor.py -------------------------------------------------------------------------------- /duration_predictors_files/duration_predictor.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/duration_predictors_files/duration_predictor.yaml -------------------------------------------------------------------------------- /duration_predictors_files/playground_duration.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/duration_predictors_files/playground_duration.py -------------------------------------------------------------------------------- /duration_predictors_files/saved_models/predictor_model_sec_dividing_kernel_5.ckpt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/duration_predictors_files/saved_models/predictor_model_sec_dividing_kernel_5.ckpt -------------------------------------------------------------------------------- /empty_sec_audio.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/empty_sec_audio.wav -------------------------------------------------------------------------------- /energy_predictor_files/Text_To_Speech_Procedure.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/energy_predictor_files/Text_To_Speech_Procedure.py -------------------------------------------------------------------------------- /energy_predictor_files/energy_predictor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/energy_predictor_files/energy_predictor.py -------------------------------------------------------------------------------- /energy_predictor_files/energy_predictor.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/energy_predictor_files/energy_predictor.yaml -------------------------------------------------------------------------------- /energy_predictor_files/energy_predictor_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/energy_predictor_files/energy_predictor_utils.py -------------------------------------------------------------------------------- /energy_predictor_files/playground_energy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/energy_predictor_files/playground_energy.py -------------------------------------------------------------------------------- /energy_predictor_files/saved_models/energy_predictor_model_2_layers_7_5_k.ckpt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/energy_predictor_files/saved_models/energy_predictor_model_2_layers_7_5_k.ckpt -------------------------------------------------------------------------------- /eval.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/eval.py -------------------------------------------------------------------------------- /folder2json.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/folder2json.py -------------------------------------------------------------------------------- /folder2json_npy.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/folder2json_npy.py -------------------------------------------------------------------------------- /folder2json_text.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/folder2json_text.py -------------------------------------------------------------------------------- /inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/inference.py -------------------------------------------------------------------------------- /learner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/learner.py -------------------------------------------------------------------------------- /model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/model.py -------------------------------------------------------------------------------- /params.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/params.py -------------------------------------------------------------------------------- /utils_for_inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/RBenita/DIFFAR/HEAD/utils_for_inference.py --------------------------------------------------------------------------------