├── README.md ├── egs2 ├── aishell │ ├── asr_unimodal.sh │ ├── exp_uma_conformer_12e_69 │ │ └── asr_train_asr_unimodal_conformer_raw_zh_char_sp │ │ │ ├── RESULTS.md │ │ │ ├── config.yaml │ │ │ ├── images │ │ │ ├── backward_time.png │ │ │ ├── cer.png │ │ │ ├── cer_ctc.png │ │ │ ├── forward_time.png │ │ │ ├── gpu_max_cached_mem_GB.png │ │ │ ├── iter_time.png │ │ │ ├── loss.png │ │ │ ├── loss_ctc.png │ │ │ ├── optim0_lr0.png │ │ │ ├── optim_step_time.png │ │ │ └── train_time.png │ │ │ └── train.log │ ├── exp_uma_conformer_condition0302_32_731 │ │ └── asr_train_asr_uma_conformer_condition_raw_zh_char_sp │ │ │ ├── RESULTS.md │ │ │ ├── config.yaml │ │ │ ├── images │ │ │ ├── backward_time.png │ │ │ ├── cer.png │ │ │ ├── cer_ctc.png │ │ │ ├── cer_interctc_declayer2.png │ │ │ ├── cer_interctc_declayer4.png │ │ │ ├── cer_interctc_enclayer12.png │ │ │ ├── cer_interctc_enclayer6.png │ │ │ ├── cer_interctc_enclayer9.png │ │ │ ├── forward_time.png │ │ │ ├── gpu_max_cached_mem_GB.png │ │ │ ├── iter_time.png │ │ │ ├── loss.png │ │ │ ├── loss_ctc.png │ │ │ ├── loss_interctc_declayer2.png │ │ │ ├── loss_interctc_declayer4.png │ │ │ ├── loss_interctc_enclayer12.png │ │ │ ├── loss_interctc_enclayer6.png │ │ │ ├── loss_interctc_enclayer9.png │ │ │ ├── optim0_lr0.png │ │ │ ├── optim_step_time.png │ │ │ └── train_time.png │ │ │ └── train.log │ ├── exp_uma_mamba_0617 │ │ └── asr_train_asr_uma_mamba_raw_zh_char_sp │ │ │ ├── RESULTS.md │ │ │ ├── config.yaml │ │ │ ├── images │ │ │ ├── backward_time.png │ │ │ ├── cer.png │ │ │ ├── cer_ctc.png │ │ │ ├── forward_time.png │ │ │ ├── gpu_max_cached_mem_GB.png │ │ │ ├── iter_time.png │ │ │ ├── loss.png │ │ │ ├── loss_ctc.png │ │ │ ├── optim0_lr0.png │ │ │ ├── optim_step_time.png │ │ │ ├── text_vs_uma.png │ │ │ ├── train_time.png │ │ │ └── uma_reduction.png │ │ │ ├── train.1.log │ │ │ └── train.2.log │ ├── run_unimodal.sh │ └── umaconf │ │ ├── decode_asr_uma.yaml │ │ ├── train_asr_uma_conformer.yaml │ │ ├── train_asr_uma_conformer_condition.yaml │ │ └── train_asr_uma_mamba.yaml ├── aishell2 │ ├── asr_unimodal.sh │ ├── exp_uma_conformer_12e_718 │ │ ├── asr_train_asr_uma_conformer_condition_raw_zh_char_sp │ │ │ ├── RESULTS.md │ │ │ ├── config.yaml │ │ │ ├── images │ │ │ │ ├── backward_time.png │ │ │ │ ├── cer.png │ │ │ │ ├── cer_ctc.png │ │ │ │ ├── cer_interctc_declayer2.png │ │ │ │ ├── cer_interctc_declayer4.png │ │ │ │ ├── cer_interctc_enclayer12.png │ │ │ │ ├── cer_interctc_enclayer6.png │ │ │ │ ├── cer_interctc_enclayer9.png │ │ │ │ ├── forward_time.png │ │ │ │ ├── gpu_max_cached_mem_GB.png │ │ │ │ ├── iter_time.png │ │ │ │ ├── loss.png │ │ │ │ ├── loss_ctc.png │ │ │ │ ├── loss_interctc_declayer2.png │ │ │ │ ├── loss_interctc_declayer4.png │ │ │ │ ├── loss_interctc_enclayer12.png │ │ │ │ ├── loss_interctc_enclayer6.png │ │ │ │ ├── loss_interctc_enclayer9.png │ │ │ │ ├── optim0_lr0.png │ │ │ │ ├── optim_step_time.png │ │ │ │ └── train_time.png │ │ │ └── train.log │ │ └── asr_train_asr_uma_conformer_raw_zh_char_sp │ │ │ ├── RESULTS.md │ │ │ ├── config.yaml │ │ │ ├── images │ │ │ ├── backward_time.png │ │ │ ├── cer.png │ │ │ ├── cer_ctc.png │ │ │ ├── forward_time.png │ │ │ ├── gpu_max_cached_mem_GB.png │ │ │ ├── iter_time.png │ │ │ ├── loss.png │ │ │ ├── loss_ctc.png │ │ │ ├── optim0_lr0.png │ │ │ ├── optim_step_time.png │ │ │ └── train_time.png │ │ │ └── train.log │ ├── exp_uma_mamba_0819 │ │ └── asr_train_asr_uma_mamba_b_raw_zh_char_sp │ │ │ ├── RESULTS.md │ │ │ ├── config.yaml │ │ │ ├── images │ │ │ ├── backward_time.png │ │ │ ├── cer.png │ │ │ ├── cer_ctc.png │ │ │ ├── forward_time.png │ │ │ ├── gpu_max_cached_mem_GB.png │ │ │ ├── iter_time.png │ │ │ ├── loss.png │ │ │ ├── loss_ctc.png │ │ │ ├── optim0_lr0.png │ │ │ ├── optim_step_time.png │ │ │ ├── text_vs_uma.png │ │ │ ├── train_time.png │ │ │ └── uma_reduction.png │ │ │ └── train.log │ ├── run_unimodal.sh │ └── umaconf │ │ ├── decode_asr_uma.yaml │ │ ├── train_asr_uma_conformer.yaml │ │ ├── train_asr_uma_conformer_condition.yaml │ │ └── train_asr_uma_mamba_b.yaml └── hkust │ ├── asr_unimodal.sh │ ├── exp_uma_branchformer_12e_69 │ └── asr_train_asr_uma_branchformer_raw_zh_char_sp │ │ ├── RESULTS.md │ │ ├── config.yaml │ │ ├── images │ │ ├── backward_time.png │ │ ├── cer.png │ │ ├── cer_ctc.png │ │ ├── forward_time.png │ │ ├── gpu_max_cached_mem_GB.png │ │ ├── iter_time.png │ │ ├── loss.png │ │ ├── loss_ctc.png │ │ ├── optim0_lr0.png │ │ ├── optim_step_time.png │ │ └── train_time.png │ │ └── train.log │ ├── exp_uma_branchformer_condition0302_32_711 │ └── asr_train_asr_uma_branchformer_condition_raw_zh_char_sp │ │ ├── RESULTS.md │ │ ├── config.yaml │ │ ├── images │ │ ├── backward_time.png │ │ ├── cer.png │ │ ├── cer_ctc.png │ │ ├── cer_interctc_declayer2.png │ │ ├── cer_interctc_declayer4.png │ │ ├── cer_interctc_enclayer12.png │ │ ├── cer_interctc_enclayer6.png │ │ ├── cer_interctc_enclayer9.png │ │ ├── forward_time.png │ │ ├── gpu_max_cached_mem_GB.png │ │ ├── iter_time.png │ │ ├── loss.png │ │ ├── loss_ctc.png │ │ ├── loss_interctc_declayer2.png │ │ ├── loss_interctc_declayer4.png │ │ ├── loss_interctc_enclayer12.png │ │ ├── loss_interctc_enclayer6.png │ │ ├── loss_interctc_enclayer9.png │ │ ├── optim0_lr0.png │ │ ├── optim_step_time.png │ │ └── train_time.png │ │ └── train.log │ ├── exp_uma_conformer_12e_67 │ └── asr_train_asr_uma_conformer_raw_zh_char_sp │ │ ├── RESULTS.md │ │ ├── config.yaml │ │ ├── images │ │ ├── backward_time.png │ │ ├── cer.png │ │ ├── cer_ctc.png │ │ ├── forward_time.png │ │ ├── gpu_max_cached_mem_GB.png │ │ ├── iter_time.png │ │ ├── loss.png │ │ ├── loss_ctc.png │ │ ├── optim0_lr0.png │ │ ├── optim_step_time.png │ │ └── train_time.png │ │ └── train.log │ ├── exp_uma_conformer_condition0302_32_712 │ └── asr_train_asr_uma_conformer_condition_raw_zh_char_sp │ │ ├── RESULTS.md │ │ ├── config.yaml │ │ ├── images │ │ ├── backward_time.png │ │ ├── cer.png │ │ ├── cer_ctc.png │ │ ├── cer_interctc_declayer2.png │ │ ├── cer_interctc_declayer4.png │ │ ├── cer_interctc_enclayer12.png │ │ ├── cer_interctc_enclayer6.png │ │ ├── cer_interctc_enclayer9.png │ │ ├── forward_time.png │ │ ├── gpu_max_cached_mem_GB.png │ │ ├── iter_time.png │ │ ├── loss.png │ │ ├── loss_ctc.png │ │ ├── loss_interctc_declayer2.png │ │ ├── loss_interctc_declayer4.png │ │ ├── loss_interctc_enclayer12.png │ │ ├── loss_interctc_enclayer6.png │ │ ├── loss_interctc_enclayer9.png │ │ ├── optim0_lr0.png │ │ ├── optim_step_time.png │ │ └── train_time.png │ │ └── train.log │ ├── run_unimodal.sh │ └── umaconf │ ├── decode_asr_uma.yaml │ ├── train_asr_uma_branchformer.yaml │ ├── train_asr_uma_branchformer_condition.yaml │ ├── train_asr_uma_conformer.yaml │ └── train_asr_uma_conformer_condition.yaml ├── espnet2 ├── asr │ ├── decoder │ │ └── unimodal_attention_decoder.py │ ├── encoder │ │ ├── conformer_encoder.py │ │ ├── e_branchformer_condition_encoder.py │ │ └── mamba_encoder.py │ ├── mamba_ssm │ │ ├── __init__.py │ │ ├── modules │ │ │ ├── __init__.py │ │ │ └── mamba_simple.py │ │ ├── ops │ │ │ ├── __init__.py │ │ │ ├── __pycache__ │ │ │ │ ├── __init__.cpython-39.pyc │ │ │ │ └── selective_scan_interface.cpython-39.pyc │ │ │ ├── selective_scan_interface.py │ │ │ └── triton │ │ │ │ ├── __init__.py │ │ │ │ ├── __pycache__ │ │ │ │ ├── __init__.cpython-39.pyc │ │ │ │ ├── layernorm.cpython-39.pyc │ │ │ │ └── selective_state_update.cpython-39.pyc │ │ │ │ ├── layernorm.py │ │ │ │ └── selective_state_update.py │ │ └── utils │ │ │ ├── __init__.py │ │ │ ├── generation.py │ │ │ └── hf.py │ ├── uma.py │ └── unimodal_attention_model.py ├── bin │ ├── asr_unimodal_inference.py │ └── asr_unimodal_train.py └── tasks │ └── asr_unimodal.py ├── mamba_uma.png └── uma.png /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/README.md -------------------------------------------------------------------------------- /egs2/aishell/asr_unimodal.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/asr_unimodal.sh -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/RESULTS.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/RESULTS.md -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/config.yaml -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/backward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/backward_time.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/cer.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/cer.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/cer_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/cer_ctc.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/forward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/forward_time.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/iter_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/iter_time.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/loss.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/loss_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/loss_ctc.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/optim0_lr0.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/optim0_lr0.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/optim_step_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/optim_step_time.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/train_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/images/train_time.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/train.log: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_12e_69/asr_train_asr_unimodal_conformer_raw_zh_char_sp/train.log -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/RESULTS.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/RESULTS.md -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/config.yaml -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/backward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/backward_time.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_ctc.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_declayer2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_declayer2.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_declayer4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_declayer4.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer12.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer12.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer6.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer9.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer9.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/forward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/forward_time.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/iter_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/iter_time.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_ctc.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_declayer2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_declayer2.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_declayer4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_declayer4.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer12.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer12.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer6.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer9.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer9.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/optim0_lr0.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/optim0_lr0.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/optim_step_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/optim_step_time.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/train_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/train_time.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/train.log: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_conformer_condition0302_32_731/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/train.log -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/RESULTS.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/RESULTS.md -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/config.yaml -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/backward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/backward_time.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/cer.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/cer.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/cer_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/cer_ctc.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/forward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/forward_time.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/iter_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/iter_time.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/loss.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/loss_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/loss_ctc.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/optim0_lr0.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/optim0_lr0.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/optim_step_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/optim_step_time.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/text_vs_uma.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/text_vs_uma.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/train_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/train_time.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/uma_reduction.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/images/uma_reduction.png -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/train.1.log: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/train.1.log -------------------------------------------------------------------------------- /egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/train.2.log: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/exp_uma_mamba_0617/asr_train_asr_uma_mamba_raw_zh_char_sp/train.2.log -------------------------------------------------------------------------------- /egs2/aishell/run_unimodal.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/run_unimodal.sh -------------------------------------------------------------------------------- /egs2/aishell/umaconf/decode_asr_uma.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/umaconf/decode_asr_uma.yaml -------------------------------------------------------------------------------- /egs2/aishell/umaconf/train_asr_uma_conformer.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/umaconf/train_asr_uma_conformer.yaml -------------------------------------------------------------------------------- /egs2/aishell/umaconf/train_asr_uma_conformer_condition.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/umaconf/train_asr_uma_conformer_condition.yaml -------------------------------------------------------------------------------- /egs2/aishell/umaconf/train_asr_uma_mamba.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell/umaconf/train_asr_uma_mamba.yaml -------------------------------------------------------------------------------- /egs2/aishell2/asr_unimodal.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/asr_unimodal.sh -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/RESULTS.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/RESULTS.md -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/config.yaml -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/backward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/backward_time.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_ctc.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_declayer2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_declayer2.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_declayer4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_declayer4.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer12.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer12.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer6.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer9.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer9.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/forward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/forward_time.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/iter_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/iter_time.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_ctc.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_declayer2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_declayer2.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_declayer4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_declayer4.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer12.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer12.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer6.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer9.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer9.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/optim0_lr0.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/optim0_lr0.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/optim_step_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/optim_step_time.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/train_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/train_time.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/train.log: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/train.log -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/RESULTS.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/RESULTS.md -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/config.yaml -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/backward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/backward_time.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/cer.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/cer.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/cer_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/cer_ctc.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/forward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/forward_time.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/iter_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/iter_time.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/loss.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/loss_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/loss_ctc.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/optim0_lr0.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/optim0_lr0.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/optim_step_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/optim_step_time.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/train_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/images/train_time.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/train.log: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_conformer_12e_718/asr_train_asr_uma_conformer_raw_zh_char_sp/train.log -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/RESULTS.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/RESULTS.md -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/config.yaml -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/backward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/backward_time.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/cer.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/cer.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/cer_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/cer_ctc.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/forward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/forward_time.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/iter_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/iter_time.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/loss.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/loss_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/loss_ctc.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/optim0_lr0.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/optim0_lr0.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/optim_step_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/optim_step_time.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/text_vs_uma.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/text_vs_uma.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/train_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/train_time.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/uma_reduction.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/images/uma_reduction.png -------------------------------------------------------------------------------- /egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/train.log: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/exp_uma_mamba_0819/asr_train_asr_uma_mamba_b_raw_zh_char_sp/train.log -------------------------------------------------------------------------------- /egs2/aishell2/run_unimodal.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/run_unimodal.sh -------------------------------------------------------------------------------- /egs2/aishell2/umaconf/decode_asr_uma.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/umaconf/decode_asr_uma.yaml -------------------------------------------------------------------------------- /egs2/aishell2/umaconf/train_asr_uma_conformer.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/umaconf/train_asr_uma_conformer.yaml -------------------------------------------------------------------------------- /egs2/aishell2/umaconf/train_asr_uma_conformer_condition.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/umaconf/train_asr_uma_conformer_condition.yaml -------------------------------------------------------------------------------- /egs2/aishell2/umaconf/train_asr_uma_mamba_b.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/aishell2/umaconf/train_asr_uma_mamba_b.yaml -------------------------------------------------------------------------------- /egs2/hkust/asr_unimodal.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/asr_unimodal.sh -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/RESULTS.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/RESULTS.md -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/config.yaml -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/backward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/backward_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/cer.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/cer.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/cer_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/cer_ctc.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/forward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/forward_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/iter_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/iter_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/loss.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/loss_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/loss_ctc.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/optim0_lr0.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/optim0_lr0.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/optim_step_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/optim_step_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/train_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/images/train_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/train.log: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_12e_69/asr_train_asr_uma_branchformer_raw_zh_char_sp/train.log -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/RESULTS.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/RESULTS.md -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/config.yaml -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/backward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/backward_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/cer.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/cer.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/cer_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/cer_ctc.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/cer_interctc_declayer2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/cer_interctc_declayer2.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/cer_interctc_declayer4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/cer_interctc_declayer4.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer12.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer12.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer6.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer9.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer9.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/forward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/forward_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/iter_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/iter_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/loss.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/loss_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/loss_ctc.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/loss_interctc_declayer2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/loss_interctc_declayer2.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/loss_interctc_declayer4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/loss_interctc_declayer4.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer12.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer12.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer6.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer9.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer9.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/optim0_lr0.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/optim0_lr0.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/optim_step_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/optim_step_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/train_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/images/train_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/train.log: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_branchformer_condition0302_32_711/asr_train_asr_uma_branchformer_condition_raw_zh_char_sp/train.log -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/RESULTS.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/RESULTS.md -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/config.yaml -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/backward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/backward_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/cer.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/cer.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/cer_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/cer_ctc.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/forward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/forward_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/iter_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/iter_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/loss.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/loss_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/loss_ctc.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/optim0_lr0.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/optim0_lr0.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/optim_step_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/optim_step_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/train_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/images/train_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/train.log: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_12e_67/asr_train_asr_uma_conformer_raw_zh_char_sp/train.log -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/RESULTS.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/RESULTS.md -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/config.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/config.yaml -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/backward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/backward_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_ctc.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_declayer2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_declayer2.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_declayer4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_declayer4.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer12.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer12.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer6.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer9.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/cer_interctc_enclayer9.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/forward_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/forward_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/gpu_max_cached_mem_GB.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/iter_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/iter_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_ctc.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_ctc.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_declayer2.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_declayer2.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_declayer4.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_declayer4.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer12.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer12.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer6.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer6.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer9.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/loss_interctc_enclayer9.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/optim0_lr0.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/optim0_lr0.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/optim_step_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/optim_step_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/train_time.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/images/train_time.png -------------------------------------------------------------------------------- /egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/train.log: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/exp_uma_conformer_condition0302_32_712/asr_train_asr_uma_conformer_condition_raw_zh_char_sp/train.log -------------------------------------------------------------------------------- /egs2/hkust/run_unimodal.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/run_unimodal.sh -------------------------------------------------------------------------------- /egs2/hkust/umaconf/decode_asr_uma.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/umaconf/decode_asr_uma.yaml -------------------------------------------------------------------------------- /egs2/hkust/umaconf/train_asr_uma_branchformer.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/umaconf/train_asr_uma_branchformer.yaml -------------------------------------------------------------------------------- /egs2/hkust/umaconf/train_asr_uma_branchformer_condition.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/umaconf/train_asr_uma_branchformer_condition.yaml -------------------------------------------------------------------------------- /egs2/hkust/umaconf/train_asr_uma_conformer.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/umaconf/train_asr_uma_conformer.yaml -------------------------------------------------------------------------------- /egs2/hkust/umaconf/train_asr_uma_conformer_condition.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/egs2/hkust/umaconf/train_asr_uma_conformer_condition.yaml -------------------------------------------------------------------------------- /espnet2/asr/decoder/unimodal_attention_decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/decoder/unimodal_attention_decoder.py -------------------------------------------------------------------------------- /espnet2/asr/encoder/conformer_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/encoder/conformer_encoder.py -------------------------------------------------------------------------------- /espnet2/asr/encoder/e_branchformer_condition_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/encoder/e_branchformer_condition_encoder.py -------------------------------------------------------------------------------- /espnet2/asr/encoder/mamba_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/encoder/mamba_encoder.py -------------------------------------------------------------------------------- /espnet2/asr/mamba_ssm/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/mamba_ssm/__init__.py -------------------------------------------------------------------------------- /espnet2/asr/mamba_ssm/modules/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /espnet2/asr/mamba_ssm/modules/mamba_simple.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/mamba_ssm/modules/mamba_simple.py -------------------------------------------------------------------------------- /espnet2/asr/mamba_ssm/ops/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /espnet2/asr/mamba_ssm/ops/__pycache__/__init__.cpython-39.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/mamba_ssm/ops/__pycache__/__init__.cpython-39.pyc -------------------------------------------------------------------------------- /espnet2/asr/mamba_ssm/ops/__pycache__/selective_scan_interface.cpython-39.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/mamba_ssm/ops/__pycache__/selective_scan_interface.cpython-39.pyc -------------------------------------------------------------------------------- /espnet2/asr/mamba_ssm/ops/selective_scan_interface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/mamba_ssm/ops/selective_scan_interface.py -------------------------------------------------------------------------------- /espnet2/asr/mamba_ssm/ops/triton/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /espnet2/asr/mamba_ssm/ops/triton/__pycache__/__init__.cpython-39.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/mamba_ssm/ops/triton/__pycache__/__init__.cpython-39.pyc -------------------------------------------------------------------------------- /espnet2/asr/mamba_ssm/ops/triton/__pycache__/layernorm.cpython-39.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/mamba_ssm/ops/triton/__pycache__/layernorm.cpython-39.pyc -------------------------------------------------------------------------------- /espnet2/asr/mamba_ssm/ops/triton/__pycache__/selective_state_update.cpython-39.pyc: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/mamba_ssm/ops/triton/__pycache__/selective_state_update.cpython-39.pyc -------------------------------------------------------------------------------- /espnet2/asr/mamba_ssm/ops/triton/layernorm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/mamba_ssm/ops/triton/layernorm.py -------------------------------------------------------------------------------- /espnet2/asr/mamba_ssm/ops/triton/selective_state_update.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/mamba_ssm/ops/triton/selective_state_update.py -------------------------------------------------------------------------------- /espnet2/asr/mamba_ssm/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /espnet2/asr/mamba_ssm/utils/generation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/mamba_ssm/utils/generation.py -------------------------------------------------------------------------------- /espnet2/asr/mamba_ssm/utils/hf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/mamba_ssm/utils/hf.py -------------------------------------------------------------------------------- /espnet2/asr/uma.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/uma.py -------------------------------------------------------------------------------- /espnet2/asr/unimodal_attention_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/asr/unimodal_attention_model.py -------------------------------------------------------------------------------- /espnet2/bin/asr_unimodal_inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/bin/asr_unimodal_inference.py -------------------------------------------------------------------------------- /espnet2/bin/asr_unimodal_train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/bin/asr_unimodal_train.py -------------------------------------------------------------------------------- /espnet2/tasks/asr_unimodal.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/espnet2/tasks/asr_unimodal.py -------------------------------------------------------------------------------- /mamba_uma.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/mamba_uma.png -------------------------------------------------------------------------------- /uma.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/Audio-WestlakeU/UMA-ASR/HEAD/uma.png --------------------------------------------------------------------------------