├── src ├── .version ├── lm │ ├── examples │ │ ├── input3.fst │ │ ├── input4.fst │ │ ├── YEARDATE.txt │ │ ├── input4.txt │ │ ├── MONTH.txt │ │ ├── input3.txt │ │ ├── DAYOFMONTH.txt │ │ ├── YEAR.txt │ │ └── CREATURE.txt │ ├── test_data │ │ ├── missing_backoffs.arpa │ │ ├── input.arpa │ │ └── unused_backoffs.arpa │ ├── irstlm.mk │ └── Makefile ├── nnet2bin │ └── raw-nnet-init ├── gst-plugin │ └── kaldimarshal.list ├── doc │ ├── Kaldi.pptx │ ├── KaldiMatrix.pptx │ ├── KaldiModels.pptx │ └── KaldiScripts.pptx ├── feat │ └── test_data │ │ ├── test.wav │ │ ├── test.wav.fbank_htk.1 │ │ ├── test.wav.fbank_htk.2 │ │ ├── test.wav.fbank_htk.3 │ │ ├── test.wav.fbank_htk.4 │ │ ├── test.wav.fea_htk.1 │ │ ├── test.wav.fea_htk.2 │ │ ├── test.wav.fea_htk.3 │ │ ├── test.wav.fea_htk.4 │ │ ├── test.wav.fea_htk.5 │ │ ├── test.wav.fea_htk.6 │ │ ├── test.wav.plp_htk.1 │ │ └── prepare_wav_in_ascii.m ├── onlinebin │ └── java-online-audio-client │ │ └── MANIFEST.MF ├── probe │ └── Makefile.slow_expf ├── lmbin │ └── Makefile ├── kws │ └── Makefile └── hmm │ └── Makefile ├── egs ├── lre07 │ ├── v2 │ │ ├── lid │ │ ├── sid │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ │ ├── vad.conf │ │ │ ├── logistic-regression.conf │ │ │ ├── mfcc_asr.conf │ │ │ ├── mfcc_vtln.conf │ │ │ └── mfcc.conf │ │ ├── local │ │ │ ├── lre07_eval │ │ │ │ └── score_lre07.v01d.pl │ │ │ ├── general_lr_closed_set_langs.txt │ │ │ └── dnn │ │ │ │ └── README │ │ └── path.sh │ └── v1 │ │ ├── sid │ │ ├── steps │ │ ├── utils │ │ ├── lid │ │ ├── nnet2 │ │ │ └── relabel_egs2.sh │ │ └── README.txt │ │ ├── conf │ │ ├── vad.conf │ │ ├── logistic-regression.conf │ │ ├── mfcc.conf │ │ └── mfcc_vtln.conf │ │ ├── local │ │ └── general_lr_closed_set_langs.txt │ │ └── path.sh ├── sre10 │ ├── v2 │ │ ├── sid │ │ ├── local │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ │ ├── vad.conf │ │ │ ├── decode_dnn.config │ │ │ ├── mfcc_asr.conf │ │ │ ├── decode.config │ │ │ └── mfcc.conf │ │ └── path.sh │ └── v1 │ │ ├── sid │ │ ├── steps │ │ ├── utils │ │ 
├── conf │ │ ├── vad.conf │ │ └── mfcc.conf │ │ ├── local │ │ └── dnn │ │ │ └── README │ │ └── path.sh ├── ssar │ └── s5 │ │ └── RESULTS ├── gp │ ├── s5 │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ │ ├── mfcc.conf │ │ │ ├── sgmm.conf │ │ │ ├── tri.conf │ │ │ └── lang_codes.txt │ │ └── local │ │ │ └── gp_norm_trans_CZ.pl │ └── s1 │ │ └── conf │ │ ├── mfcc.conf │ │ └── lang_codes.txt ├── lre │ ├── v1 │ │ ├── sid │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ │ ├── vad.conf │ │ │ ├── logistic-regression.conf │ │ │ ├── mfcc.conf │ │ │ └── mfcc_vtln.conf │ │ ├── local │ │ │ └── callfriend_lang.txt │ │ ├── lid │ │ │ └── README.txt │ │ └── path.sh │ └── README.txt ├── rm │ └── s5 │ │ ├── conf │ │ ├── pitch_process.conf │ │ ├── plp.conf │ │ ├── mfcc.conf │ │ ├── pitch.conf │ │ ├── online_cmvn.conf │ │ ├── decode.config │ │ ├── fbank.conf │ │ └── decode_dnn.config │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ └── score.sh │ │ └── path.sh ├── ami │ ├── s5 │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ │ ├── pitch.conf │ │ │ ├── mfcc.conf │ │ │ ├── decode_tandem.conf │ │ │ ├── online_cmvn.conf │ │ │ ├── decode.conf │ │ │ ├── decode_dnn.conf │ │ │ ├── fbank.conf │ │ │ ├── queue_jsalt.conf │ │ │ └── queue_no_k20.conf │ │ └── local │ │ │ ├── english.glm │ │ │ ├── split_eval.orig │ │ │ ├── split_dev.orig │ │ │ └── split_REAMDE.txt │ └── s5b │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ ├── chain │ │ │ ├── run_tdnn.sh │ │ │ ├── run_tdnn_lstm.sh │ │ │ └── multi_condition │ │ │ │ └── run_tdnn_lstm.sh │ │ ├── english.glm │ │ ├── split_dev.orig │ │ ├── split_eval.orig │ │ ├── split_train.orig │ │ └── split_REAMDE.txt │ │ └── conf │ │ ├── mfcc.conf │ │ ├── online_cmvn.conf │ │ └── decode.conf ├── an4 │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ └── score.sh │ │ ├── conf │ │ ├── mfcc.conf │ │ └── decode.config │ │ ├── README.md │ │ ├── path.sh │ │ └── RESULTS ├── aspire │ ├── s5 │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ │ └── chain │ │ │ │ ├── run_tdnn.sh │ │ │ │ └── 
run_blstm.sh │ │ ├── conf │ │ │ ├── pitch.conf │ │ │ ├── online_cmvn.conf │ │ │ ├── mfcc.conf │ │ │ ├── voiced_feat.conf │ │ │ ├── decode_dnn.config │ │ │ ├── decode.config │ │ │ └── queue_no_k20.conf │ │ └── path.sh │ └── README.txt ├── aurora4 │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ ├── mfcc.conf │ │ ├── decode_dnn.config │ │ ├── train_dnn.config │ │ ├── train_dnn_1.config │ │ ├── train_nnet.config │ │ ├── train_dnn_2.config │ │ └── fbank.conf │ │ ├── local │ │ ├── run_nnet_cpu.sh │ │ └── dict │ │ │ └── reverse_dict.pl │ │ └── path.sh ├── babel │ ├── s5 │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ │ ├── score.sh │ │ │ ├── kws_score.sh │ │ │ ├── eval_kw_subsets.sh │ │ │ └── dict │ │ │ │ └── reverse_dict.pl │ │ └── conf │ │ │ ├── plp.conf │ │ │ ├── glm │ │ │ └── common_vars.sh │ ├── s5b │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ │ ├── score.sh │ │ │ ├── kws_score.sh │ │ │ ├── datasets │ │ │ │ ├── unsupervised_seg.sh │ │ │ │ └── unsupervised_uem.sh │ │ │ └── eval_kw_subsets.sh │ │ ├── conf │ │ │ ├── pitch.conf │ │ │ ├── plp.conf │ │ │ └── glm │ │ └── path.sh │ ├── s5c │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ │ ├── score.sh │ │ │ ├── kws_score.sh │ │ │ ├── datasets │ │ │ │ ├── unsupervised_seg.sh │ │ │ │ └── unsupervised_uem.sh │ │ │ └── eval_kw_subsets.sh │ │ ├── conf │ │ │ ├── pitch.conf │ │ │ ├── plp.conf │ │ │ └── glm │ │ └── path.sh │ └── s5d │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ ├── score.sh │ │ ├── kws_score.sh │ │ ├── datasets │ │ │ ├── unsupervised_seg.sh │ │ │ └── unsupervised_uem.sh │ │ ├── eval_kw_subsets.sh │ │ └── make_wordlist.sh │ │ ├── conf │ │ ├── pitch.conf │ │ ├── plp.conf │ │ ├── online_cmvn.conf │ │ ├── mfcc.conf │ │ └── glm │ │ └── RUN_UNICODE_SYSTEM ├── chime1 │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ ├── mfcc.conf │ │ └── queue_usfd.conf │ │ ├── path.sh │ │ └── config.sh ├── chime2 │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ ├── mfcc.conf │ │ ├── decode_dnn.config │ │ └── fbank.conf │ │ └── 
path.sh ├── chime3 │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ ├── mfcc.conf │ │ ├── decode_dnn.config │ │ └── fbank.conf │ │ └── path.sh ├── chime4 │ ├── s5_2ch │ │ ├── local │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ │ ├── mfcc.conf │ │ │ ├── decode_dnn.config │ │ │ └── fbank.conf │ │ └── path.sh │ ├── s5_6ch │ │ ├── local │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ │ ├── mfcc.conf │ │ │ ├── decode_dnn.config │ │ │ └── fbank.conf │ │ └── path.sh │ └── s5_1ch │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ ├── mfcc.conf │ │ ├── decode_dnn.config │ │ └── fbank.conf │ │ └── path.sh ├── cifar │ ├── v1 │ │ ├── steps │ │ ├── utils │ │ ├── image │ │ │ └── README.txt │ │ └── path.sh │ └── README.txt ├── csj │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ ├── score.sh │ │ ├── wer_hyp_filter │ │ └── wer_ref_filter │ │ ├── conf │ │ ├── fbank_40.conf │ │ ├── plp.conf │ │ ├── pitch.conf │ │ ├── decode_tandem.config │ │ ├── mfcc.conf │ │ ├── decode.config │ │ ├── online_cmvn.conf │ │ ├── decode_dnn.config │ │ └── fbank.conf │ │ └── path.sh ├── fame │ └── s5 │ │ ├── cmd.sh │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ ├── score.sh │ │ ├── wer_hyp_filter │ │ ├── wer_output_filter │ │ └── wer_ref_filter │ │ ├── conf │ │ ├── fbank.conf │ │ ├── mfcc.conf │ │ ├── online_cmvn.conf │ │ └── decode_dnn.config │ │ └── path.sh ├── hkust │ ├── s5 │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ │ ├── pitch.conf │ │ │ ├── online_pitch.conf │ │ │ ├── online_cmvn.conf │ │ │ ├── mfcc.conf │ │ │ ├── decode.config │ │ │ ├── pinyin_initial │ │ │ ├── fbank.conf │ │ │ └── cmu2pinyin │ │ ├── local │ │ │ ├── score.sh │ │ │ ├── wer_hyp_filter │ │ │ ├── wer_ref_filter │ │ │ └── hkust_segment.py │ │ └── path.sh │ └── README.txt ├── iban │ └── s5 │ │ ├── conf │ │ ├── decode_dnn.config │ │ ├── mfcc.conf │ │ ├── online_cmvn.conf │ │ └── decode.config │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ └── score.sh │ │ ├── cmd.sh │ │ └── path.sh ├── reverb │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── 
local │ │ ├── flist2scp.pl │ │ ├── score_mbr.sh │ │ └── normalize_transcript.pl │ │ ├── conf │ │ ├── fbank.conf │ │ ├── mfcc.conf │ │ └── decode_dnn.config │ │ └── path.sh ├── sre08 │ └── v1 │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ ├── vad.conf │ │ └── mfcc.conf │ │ └── path.sh ├── svhn │ ├── v1 │ │ ├── image │ │ ├── steps │ │ ├── utils │ │ └── path.sh │ └── README.txt ├── swahili │ └── s5 │ │ ├── conf │ │ ├── steps │ │ ├── utils │ │ ├── cmd.sh │ │ └── local │ │ └── prepare_lm.sh ├── swbd │ ├── s5 │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ │ ├── mfcc.conf │ │ │ ├── decode.config │ │ │ ├── decode_dnn.config │ │ │ └── fbank.conf │ │ └── path.sh │ ├── s5b │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ │ ├── pitch.conf │ │ │ ├── decode_tandem.config │ │ │ ├── online_cmvn.conf │ │ │ ├── mfcc.conf │ │ │ ├── decode.config │ │ │ ├── decode_dnn.config │ │ │ └── fbank.conf │ │ └── path.sh │ └── s5c │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ ├── pitch.conf │ │ ├── decode_tandem.config │ │ ├── decode_online.config │ │ ├── online_cmvn.conf │ │ ├── mfcc.conf │ │ ├── decode.config │ │ ├── decode_dnn.config │ │ └── fbank.conf │ │ ├── local │ │ ├── chain │ │ │ ├── run_lstm.sh │ │ │ ├── run_tdnn.sh │ │ │ ├── run_blstm.sh │ │ │ ├── run_tdnn_lstm.sh │ │ │ ├── run_tdnn_blstm.sh │ │ │ └── compare_wer_tdnn.sh │ │ ├── nnet3 │ │ │ ├── run_tdnn.sh │ │ │ ├── run_tdnn_disc.sh │ │ │ ├── run_tdnn_lfr.sh │ │ │ └── run_tdnn_lfr_disc.sh │ │ └── MSU_single_letter.txt │ │ └── path.sh ├── tedlium │ ├── s5 │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ │ ├── score.sh │ │ │ ├── nnet3 │ │ │ │ └── README │ │ │ └── chain │ │ │ │ └── README │ │ ├── conf │ │ │ ├── decode.config │ │ │ ├── mfcc.conf │ │ │ ├── pitch.conf │ │ │ ├── online_cmvn.conf │ │ │ ├── decode_dnn.config │ │ │ ├── fbank.conf │ │ │ └── no_k20.conf │ │ └── path.sh │ ├── s5_r2 │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ │ ├── score.sh │ │ │ ├── chain │ │ │ │ ├── run_tdnn.sh │ │ │ │ ├── run_tdnn_lstm.sh │ │ │ │ └── run_tdnn_lstm_disc.sh 
│ │ │ └── nnet3 │ │ │ │ ├── run_lstm.sh │ │ │ │ ├── run_tdnn.sh │ │ │ │ ├── run_tdnn_lstm.sh │ │ │ │ ├── run_tdnn_lstm_disc.sh │ │ │ │ └── run_tdnn_lstm_lfr.sh │ │ ├── conf │ │ │ ├── decode.config │ │ │ ├── mfcc.conf │ │ │ ├── pitch.conf │ │ │ ├── online_cmvn.conf │ │ │ ├── decode_dnn.config │ │ │ ├── fbank.conf │ │ │ └── no_k20.conf │ │ └── path.sh │ └── s5_r2_wsj │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ ├── score.sh │ │ ├── dict │ │ ├── download_data.sh │ │ ├── flist2scp.pl │ │ ├── join_suffix.py │ │ ├── ndx2flist.pl │ │ ├── run_segmentation_wsj.sh │ │ ├── find_transcripts.pl │ │ └── normalize_transcript.pl │ │ ├── conf │ │ ├── decode.config │ │ ├── mfcc.conf │ │ ├── pitch.conf │ │ ├── online_cmvn.conf │ │ ├── decode_dnn.config │ │ ├── fbank.conf │ │ └── no_k20.conf │ │ └── path.sh ├── timit │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ └── score.sh │ │ ├── conf │ │ ├── mfcc.conf │ │ ├── fbank.conf │ │ └── test_spk.list │ │ └── path.sh ├── wsj │ └── s5 │ │ ├── steps │ │ ├── decode_si.sh │ │ ├── train_nnet.sh │ │ ├── append_feats.sh │ │ ├── decode_nnet.sh │ │ ├── tandem │ │ │ └── decode_si.sh │ │ ├── score_kaldi.sh │ │ ├── score_kaldi_compare.sh │ │ ├── nnet2 │ │ │ └── get_num_frames.sh │ │ └── libs │ │ │ ├── nnet3 │ │ │ ├── report │ │ │ │ └── __init__.py │ │ │ ├── xconfig │ │ │ │ └── layers.py │ │ │ ├── train │ │ │ │ ├── chain_objf │ │ │ │ │ └── __init__.py │ │ │ │ ├── frame_level_objf │ │ │ │ │ └── __init__.py │ │ │ │ └── __init__.py │ │ │ └── __init__.py │ │ │ └── __init__.py │ │ ├── local │ │ ├── score.sh │ │ ├── chain │ │ │ ├── run_tdnn.sh │ │ │ └── run_tdnn_lstm.sh │ │ ├── nnet3 │ │ │ ├── run_tdnn.sh │ │ │ ├── run_tdnn_lstm.sh │ │ │ ├── run_tdnn_lstm_lfr.sh │ │ │ └── run_tdnn_lstm_disc.sh │ │ ├── wer_hyp_filter │ │ ├── wer_ref_filter │ │ ├── wer_output_filter │ │ └── dict │ │ │ └── reverse_dict.pl │ │ ├── utils │ │ ├── data │ │ │ ├── split_data.sh │ │ │ ├── combine_data.sh │ │ │ ├── copy_data_dir.sh │ │ │ ├── fix_data_dir.sh │ │ │ ├── 
subset_data_dir.sh │ │ │ ├── validate_data_dir.sh │ │ │ └── perturb_data_dir_speed.sh │ │ ├── lang │ │ │ ├── prepare_lang.sh │ │ │ ├── validate_lang.pl │ │ │ └── add_lex_disambig.pl │ │ └── filt.py │ │ ├── conf │ │ ├── fbank.conf │ │ ├── mfcc.conf │ │ ├── online_cmvn.conf │ │ └── decode_dnn.config │ │ └── path.sh ├── yesno │ ├── s5 │ │ ├── steps │ │ ├── utils │ │ ├── input │ │ │ ├── phones.txt │ │ │ ├── lexicon_nosil.txt │ │ │ ├── lexicon.txt │ │ │ └── task.arpabo │ │ ├── conf │ │ │ └── mfcc.conf │ │ ├── local │ │ │ ├── create_yesno_wav_scp.pl │ │ │ ├── create_yesno_txt.pl │ │ │ └── prepare_dict.sh │ │ └── path.sh │ └── README.txt ├── farsdat │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ └── score.sh │ │ ├── conf │ │ ├── mfcc.conf │ │ ├── fbank.conf │ │ ├── test_spk.list │ │ └── dev_spk.list │ │ └── path.sh ├── fisher_swbd │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ ├── online_cmvn.conf │ │ ├── mfcc.conf │ │ ├── decode.config │ │ └── MSU_single_letter.txt │ │ └── path.sh ├── gale_arabic │ ├── s5 │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ │ ├── decode.config │ │ │ ├── mfcc.conf │ │ │ ├── pitch.conf │ │ │ ├── fbank.conf │ │ │ ├── online_cmvn.conf │ │ │ └── decode_dnn.config │ │ ├── path.sh │ │ └── local │ │ │ ├── test_list │ │ │ └── bad_segments │ └── s5b │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ ├── decode.config │ │ ├── mfcc.conf │ │ └── online_cmvn.conf │ │ ├── local │ │ ├── chain │ │ │ ├── run_tdnn.sh │ │ │ └── run_tdnn_lstm.sh │ │ ├── nnet3 │ │ │ ├── run_lstm.sh │ │ │ └── run_tdnn.sh │ │ ├── test_list │ │ └── bad_segments │ │ └── path.sh ├── gale_mandarin │ ├── s5 │ │ ├── conf │ │ │ ├── decode.config │ │ │ ├── pitch.conf │ │ │ ├── mfcc.conf │ │ │ ├── fbank.conf │ │ │ ├── decode_dnn.config │ │ │ └── cmu2pinyin │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ │ ├── score.sh │ │ │ ├── wer_hyp_filter │ │ │ ├── wer_ref_filter │ │ │ └── gale_segment.py │ │ └── path.sh │ └── README.txt ├── librispeech │ ├── s5 │ │ ├── steps │ │ ├── utils │ │ ├── 
conf │ │ │ ├── decode.config │ │ │ ├── mfcc.conf │ │ │ └── online_cmvn.conf │ │ └── local │ │ │ ├── run_nnet2_clean_100.sh │ │ │ └── run_nnet2_clean_460.sh │ └── README.txt ├── multi_en │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ ├── decode.config │ │ ├── mfcc.conf │ │ ├── online_cmvn.conf │ │ └── MSU_single_letter.txt │ │ └── local │ │ ├── ami_split_eval.orig │ │ └── ami_split_dev.orig ├── sprakbanken │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ ├── chain │ │ │ ├── run_lstm.sh │ │ │ ├── run_tdnn.sh │ │ │ └── run_tdnn_lstm.sh │ │ ├── dictsrc │ │ │ └── silence_phones.txt │ │ ├── sprak_run_nnet_cpu.sh │ │ ├── wer_hyp_filter │ │ ├── wer_ref_filter │ │ ├── wer_output_filter │ │ ├── sprak_prep_lm.sh │ │ ├── dict │ │ │ └── reverse_dict.pl │ │ └── generate_results_file.sh │ │ ├── conf │ │ ├── fbank.conf │ │ ├── mfcc.conf │ │ ├── online_cmvn.conf │ │ └── decode_dnn.config │ │ ├── complexphones.txt │ │ └── path.sh ├── thchs30 │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ └── score.sh │ │ ├── conf │ │ ├── mfcc.conf │ │ ├── fbank.conf │ │ └── decode_dnn.config │ │ └── path.sh ├── tidigits │ ├── s5 │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ │ └── mfcc.conf │ │ └── path.sh │ └── README.txt ├── voxforge │ └── s5 │ │ ├── steps │ │ ├── utils │ │ └── conf │ │ ├── mfcc.conf │ │ └── decode.config ├── vystadial_cz │ ├── s5 │ │ ├── steps │ │ ├── utils │ │ ├── common │ │ │ ├── decode.conf │ │ │ └── mfcc.conf │ │ └── local │ │ │ └── create_sample.sh │ └── online_demo │ │ ├── data │ │ └── .gitignore │ │ ├── decode │ │ └── .gitignore │ │ ├── models │ │ └── .gitignore │ │ ├── utils │ │ ├── __init__.py │ │ ├── display_gmm_latgen.sh │ │ └── run_live-demo.sh ├── vystadial_en │ ├── s5 │ │ ├── steps │ │ ├── utils │ │ ├── common │ │ │ ├── decode.conf │ │ │ └── mfcc.conf │ │ └── local │ │ │ └── create_sample.sh │ └── online_demo ├── apiai_decode │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ └── score.sh │ │ └── path.sh ├── babel_multilang │ └── s5 │ │ ├── 
steps │ │ ├── utils │ │ ├── conf │ │ ├── plp.conf │ │ ├── mfcc.conf │ │ ├── pitch.conf │ │ ├── common.fullLP │ │ ├── common_vars.sh │ │ ├── mfcc_hires.conf │ │ ├── common.limitedLP │ │ └── online_cmvn.conf │ │ ├── local │ │ ├── score_stm.sh │ │ ├── kws_search.sh │ │ ├── lattice_to_ctm.sh │ │ └── datasets │ │ │ ├── extra_kws.sh │ │ │ ├── vocab_kws.sh │ │ │ ├── supervised_pem.sh │ │ │ ├── unsupervised_seg.sh │ │ │ └── unsupervised_uem.sh │ │ └── path.sh ├── bn_music_speech │ └── v1 │ │ ├── sid │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ ├── vad.conf │ │ └── mfcc.conf │ │ ├── README │ │ └── path.sh ├── callhome_egyptian │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ ├── plp.conf │ │ ├── mfcc.conf │ │ ├── online_cmvn.conf │ │ └── decode.config │ │ ├── path.sh │ │ └── local │ │ └── splits │ │ ├── dev │ │ ├── h5 │ │ ├── sup │ │ └── test ├── fisher_english │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ ├── online_cmvn.conf │ │ ├── mfcc.conf │ │ ├── decode.config │ │ └── decode_dnn.config │ │ ├── local │ │ └── run_nnet2.sh │ │ └── path.sh ├── mini_librispeech │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ ├── chain │ │ │ └── run_tdnn.sh │ │ ├── nnet3 │ │ │ └── run_tdnn_lstm.sh │ │ ├── data_prep.sh │ │ ├── format_lms.sh │ │ └── prepare_dict.sh │ │ ├── conf │ │ ├── mfcc.conf │ │ └── online_cmvn.conf │ │ └── path.sh ├── sprakbanken_swe │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── local │ │ ├── dictsrc │ │ │ ├── optional_silence.txt │ │ │ └── silence_phones.txt │ │ └── sprak_run_nnet_cpu.sh │ │ ├── conf │ │ ├── fbank.conf │ │ ├── mfcc.conf │ │ └── decode_dnn.config │ │ └── path.sh ├── fisher_callhome_spanish │ └── s5 │ │ ├── steps │ │ ├── utils │ │ ├── conf │ │ ├── plp.conf │ │ ├── mfcc.conf │ │ └── decode.config │ │ ├── local │ │ ├── spron.pl │ │ ├── callhome_text_pp.sh │ │ ├── fix_stm.sh │ │ └── splits │ │ │ ├── dev │ │ │ ├── test │ │ │ └── split_callhome │ │ │ ├── dev │ │ │ └── test │ │ └── path.sh └── README.txt ├── tools ├── install_atlas.sh ├── 
install_speex.sh ├── install_srilm.sh ├── install_portaudio.sh ├── install_pfile_utils.sh └── extras │ ├── install_openblas.sh │ ├── install_sctk_patched.sh │ └── mikolov_rnnlm.patch ├── windows ├── .gitignore ├── NewGuidCmd.exe └── NewGuidCmd.exe.config ├── Kaldi_Pi.png ├── misc ├── logo │ ├── KaldiIco.png │ ├── KaldiLogo.docx │ ├── KaldiLogo.png │ ├── KaldiTextAndLogo.png │ └── KaldiTextAndLogoSmall.png ├── papers │ ├── asru11_toolkit │ │ ├── kaldi_asru.pdf │ │ └── figs │ │ │ └── kaldi-lib.pdf │ ├── asru11_toolkit_poster │ │ ├── kaldi-poster.pdf │ │ ├── figures │ │ │ ├── kaldi-lib.pdf │ │ │ └── KaldiTextAndLogo.png │ │ └── README │ └── icassp12_lat │ │ └── Makefile └── maintenance │ └── check_usage_messages.sh └── INSTALL /src/.version: -------------------------------------------------------------------------------- 1 | 5.2 2 | -------------------------------------------------------------------------------- /egs/lre07/v2/lid: -------------------------------------------------------------------------------- 1 | ../v1/lid -------------------------------------------------------------------------------- /egs/sre10/v2/sid: -------------------------------------------------------------------------------- 1 | ../v1/sid -------------------------------------------------------------------------------- /egs/ssar/s5/RESULTS: -------------------------------------------------------------------------------- 1 | - 2 | -------------------------------------------------------------------------------- /src/lm/examples/input3.fst: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /src/lm/examples/input4.fst: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /egs/gp/s5/steps: -------------------------------------------------------------------------------- 1 | 
../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/gp/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/lre/v1/sid: -------------------------------------------------------------------------------- 1 | ../../sre08/v1/sid -------------------------------------------------------------------------------- /egs/rm/s5/conf/pitch_process.conf: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /egs/rm/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/rm/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/sre10/v2/local: -------------------------------------------------------------------------------- 1 | ../v1/local/ -------------------------------------------------------------------------------- /egs/sre10/v2/steps: -------------------------------------------------------------------------------- 1 | ../v1/steps -------------------------------------------------------------------------------- /egs/sre10/v2/utils: -------------------------------------------------------------------------------- 1 | ../v1/utils -------------------------------------------------------------------------------- /egs/ami/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/ami/s5/utils: 
-------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/ami/s5b/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/ami/s5b/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/an4/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps/ -------------------------------------------------------------------------------- /egs/an4/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/aspire/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps/ -------------------------------------------------------------------------------- /egs/aspire/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils/ -------------------------------------------------------------------------------- /egs/aurora4/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/aurora4/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/babel/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps 
-------------------------------------------------------------------------------- /egs/babel/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/babel/s5b/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/babel/s5b/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/babel/s5c/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/babel/s5c/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/babel/s5d/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/babel/s5d/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/chime1/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/chime1/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/chime2/s5/steps: 
-------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/chime2/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/chime3/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/chime3/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/chime4/s5_2ch/local: -------------------------------------------------------------------------------- 1 | ../s5_1ch/local -------------------------------------------------------------------------------- /egs/chime4/s5_6ch/local: -------------------------------------------------------------------------------- 1 | ../s5_1ch/local -------------------------------------------------------------------------------- /egs/cifar/v1/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/cifar/v1/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/csj/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/csj/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils 
-------------------------------------------------------------------------------- /egs/fame/s5/cmd.sh: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/cmd.sh -------------------------------------------------------------------------------- /egs/fame/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/fame/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/hkust/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/hkust/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/iban/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /egs/iban/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/iban/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/lre/v1/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/lre/v1/utils: 
-------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils/ -------------------------------------------------------------------------------- /egs/lre07/v1/sid: -------------------------------------------------------------------------------- 1 | ../../sre08/v1/sid -------------------------------------------------------------------------------- /egs/lre07/v1/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/lre07/v1/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils/ -------------------------------------------------------------------------------- /egs/lre07/v2/sid: -------------------------------------------------------------------------------- 1 | ../../sre08/v1/sid -------------------------------------------------------------------------------- /egs/lre07/v2/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/lre07/v2/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils/ -------------------------------------------------------------------------------- /egs/reverb/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps/ -------------------------------------------------------------------------------- /egs/reverb/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils/ -------------------------------------------------------------------------------- /egs/sre08/v1/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps 
-------------------------------------------------------------------------------- /egs/sre08/v1/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/sre10/v1/sid: -------------------------------------------------------------------------------- 1 | ../../sre08/v1/sid/ -------------------------------------------------------------------------------- /egs/sre10/v1/steps: -------------------------------------------------------------------------------- 1 | ../../sre08/v1/steps -------------------------------------------------------------------------------- /egs/sre10/v1/utils: -------------------------------------------------------------------------------- 1 | ../../sre08/v1/utils -------------------------------------------------------------------------------- /egs/svhn/v1/image: -------------------------------------------------------------------------------- 1 | ../../cifar/v1/image -------------------------------------------------------------------------------- /egs/svhn/v1/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/svhn/v1/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/swahili/s5/conf: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/conf/ -------------------------------------------------------------------------------- /egs/swbd/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/swbd/s5/utils: 
-------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/swbd/s5b/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/swbd/s5b/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/swbd/s5c/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/swbd/s5c/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/tedlium/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/tedlium/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/timit/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/timit/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/wsj/s5/steps/decode_si.sh: -------------------------------------------------------------------------------- 1 | decode.sh 
-------------------------------------------------------------------------------- /egs/yesno/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/yesno/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /src/nnet2bin/raw-nnet-init: -------------------------------------------------------------------------------- 1 | nnet-init -------------------------------------------------------------------------------- /egs/babel/s5/local/score.sh: -------------------------------------------------------------------------------- 1 | score_sctk.sh -------------------------------------------------------------------------------- /egs/chime4/s5_1ch/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/chime4/s5_1ch/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/chime4/s5_2ch/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/chime4/s5_2ch/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/chime4/s5_6ch/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/chime4/s5_6ch/utils: 
-------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/farsdat/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps/ -------------------------------------------------------------------------------- /egs/farsdat/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils/ -------------------------------------------------------------------------------- /egs/fisher_swbd/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps/ -------------------------------------------------------------------------------- /egs/fisher_swbd/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils/ -------------------------------------------------------------------------------- /egs/gale_arabic/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps/ -------------------------------------------------------------------------------- /egs/gale_arabic/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils/ -------------------------------------------------------------------------------- /egs/gale_mandarin/s5/conf/decode.config: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /egs/librispeech/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/librispeech/s5/utils: -------------------------------------------------------------------------------- 1 | 
../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/multi_en/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps/ -------------------------------------------------------------------------------- /egs/multi_en/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/sprakbanken/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/sprakbanken/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/swahili/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps/ -------------------------------------------------------------------------------- /egs/swahili/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils/ -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/thchs30/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps/ -------------------------------------------------------------------------------- 
/egs/thchs30/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils/ -------------------------------------------------------------------------------- /egs/tidigits/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/tidigits/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/timit/s5/local/score.sh: -------------------------------------------------------------------------------- 1 | score_sclite.sh -------------------------------------------------------------------------------- /egs/voxforge/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/voxforge/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/vystadial_cz/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/vystadial_cz/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/vystadial_en/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/vystadial_en/s5/utils: 
-------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/wsj/s5/steps/train_nnet.sh: -------------------------------------------------------------------------------- 1 | nnet/train.sh -------------------------------------------------------------------------------- /egs/an4/s5/local/score.sh: -------------------------------------------------------------------------------- 1 | ../steps/score_kaldi.sh -------------------------------------------------------------------------------- /egs/apiai_decode/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps/ -------------------------------------------------------------------------------- /egs/apiai_decode/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils/ -------------------------------------------------------------------------------- /egs/babel/s5/local/kws_score.sh: -------------------------------------------------------------------------------- 1 | kws_score_f4de.sh -------------------------------------------------------------------------------- /egs/babel/s5b/local/score.sh: -------------------------------------------------------------------------------- 1 | run_kws_stt_task.sh -------------------------------------------------------------------------------- /egs/babel/s5c/local/score.sh: -------------------------------------------------------------------------------- 1 | run_kws_stt_task.sh -------------------------------------------------------------------------------- /egs/babel/s5d/local/score.sh: -------------------------------------------------------------------------------- 1 | run_kws_stt_task.sh -------------------------------------------------------------------------------- /egs/babel_multilang/s5/steps: 
-------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/babel_multilang/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/bn_music_speech/v1/sid: -------------------------------------------------------------------------------- 1 | ../../sre10/v1/sid -------------------------------------------------------------------------------- /egs/bn_music_speech/v1/steps: -------------------------------------------------------------------------------- 1 | ../../sre10/v1/steps -------------------------------------------------------------------------------- /egs/bn_music_speech/v1/utils: -------------------------------------------------------------------------------- 1 | ../../sre10/v1/utils -------------------------------------------------------------------------------- /egs/callhome_egyptian/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/callhome_egyptian/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/csj/s5/local/score.sh: -------------------------------------------------------------------------------- 1 | ../steps/score_kaldi.sh -------------------------------------------------------------------------------- /egs/farsdat/s5/local/score.sh: -------------------------------------------------------------------------------- 1 | score_sclite.sh -------------------------------------------------------------------------------- /egs/fisher_english/s5/steps: 
-------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps/ -------------------------------------------------------------------------------- /egs/fisher_english/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils/ -------------------------------------------------------------------------------- /egs/gale_arabic/s5b/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps/ -------------------------------------------------------------------------------- /egs/gale_arabic/s5b/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils/ -------------------------------------------------------------------------------- /egs/gale_mandarin/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps/ -------------------------------------------------------------------------------- /egs/gale_mandarin/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils/ -------------------------------------------------------------------------------- /egs/mini_librispeech/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps/ -------------------------------------------------------------------------------- /egs/mini_librispeech/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils/ -------------------------------------------------------------------------------- /egs/rm/s5/local/score.sh: -------------------------------------------------------------------------------- 1 | ../steps/score_kaldi.sh -------------------------------------------------------------------------------- /egs/sprakbanken_swe/s5/steps: 
-------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/sprakbanken_swe/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/tedlium/s5/local/score.sh: -------------------------------------------------------------------------------- 1 | score_sclite.sh -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/local/score.sh: -------------------------------------------------------------------------------- 1 | score_sclite.sh -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/wsj/s5/local/score.sh: -------------------------------------------------------------------------------- 1 | ../steps/score_kaldi.sh -------------------------------------------------------------------------------- /egs/wsj/s5/steps/append_feats.sh: -------------------------------------------------------------------------------- 1 | paste_feats.sh -------------------------------------------------------------------------------- /egs/wsj/s5/steps/decode_nnet.sh: -------------------------------------------------------------------------------- 1 | nnet/decode.sh -------------------------------------------------------------------------------- /egs/wsj/s5/steps/tandem/decode_si.sh: 
-------------------------------------------------------------------------------- 1 | decode.sh -------------------------------------------------------------------------------- /src/gst-plugin/kaldimarshal.list: -------------------------------------------------------------------------------- 1 | VOID:STRING 2 | -------------------------------------------------------------------------------- /tools/install_atlas.sh: -------------------------------------------------------------------------------- 1 | extras/install_atlas.sh -------------------------------------------------------------------------------- /tools/install_speex.sh: -------------------------------------------------------------------------------- 1 | extras/install_speex.sh -------------------------------------------------------------------------------- /tools/install_srilm.sh: -------------------------------------------------------------------------------- 1 | extras/install_srilm.sh -------------------------------------------------------------------------------- /egs/babel/s5b/local/kws_score.sh: -------------------------------------------------------------------------------- 1 | kws_score_f4de.sh -------------------------------------------------------------------------------- /egs/babel/s5c/local/kws_score.sh: -------------------------------------------------------------------------------- 1 | kws_score_f4de.sh -------------------------------------------------------------------------------- /egs/babel/s5d/local/kws_score.sh: -------------------------------------------------------------------------------- 1 | kws_score_f4de.sh -------------------------------------------------------------------------------- /egs/csj/s5/conf/fbank_40.conf: -------------------------------------------------------------------------------- 1 | --num-mel-bins=40 2 | -------------------------------------------------------------------------------- /egs/csj/s5/conf/plp.conf: 
-------------------------------------------------------------------------------- 1 | --sample-frequency=16000 2 | -------------------------------------------------------------------------------- /egs/fame/s5/local/score.sh: -------------------------------------------------------------------------------- 1 | ../steps/score_kaldi.sh -------------------------------------------------------------------------------- /egs/iban/s5/local/score.sh: -------------------------------------------------------------------------------- 1 | ../steps/score_kaldi.sh -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/local/score.sh: -------------------------------------------------------------------------------- 1 | score_sclite.sh -------------------------------------------------------------------------------- /egs/thchs30/s5/local/score.sh: -------------------------------------------------------------------------------- 1 | ../steps/score_kaldi.sh -------------------------------------------------------------------------------- /egs/vystadial_cz/online_demo/data/.gitignore: -------------------------------------------------------------------------------- 1 | * 2 | -------------------------------------------------------------------------------- /egs/vystadial_cz/online_demo/decode/.gitignore: -------------------------------------------------------------------------------- 1 | * 2 | -------------------------------------------------------------------------------- /egs/vystadial_cz/online_demo/models/.gitignore: -------------------------------------------------------------------------------- 1 | * 2 | -------------------------------------------------------------------------------- /egs/vystadial_cz/online_demo/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils -------------------------------------------------------------------------------- /egs/wsj/s5/utils/data/split_data.sh: 
-------------------------------------------------------------------------------- 1 | ../split_data.sh -------------------------------------------------------------------------------- /egs/yesno/s5/input/phones.txt: -------------------------------------------------------------------------------- 1 | SIL 2 | Y 3 | N 4 | -------------------------------------------------------------------------------- /tools/install_portaudio.sh: -------------------------------------------------------------------------------- 1 | extras/install_portaudio.sh -------------------------------------------------------------------------------- /egs/ami/s5/conf/pitch.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=16000 2 | -------------------------------------------------------------------------------- /egs/ami/s5b/local/chain/run_tdnn.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_1e.sh -------------------------------------------------------------------------------- /egs/ami/s5b/local/english.glm: -------------------------------------------------------------------------------- 1 | ../../s5/local/english.glm -------------------------------------------------------------------------------- /egs/apiai_decode/s5/local/score.sh: -------------------------------------------------------------------------------- 1 | ../steps/score_kaldi.sh -------------------------------------------------------------------------------- /egs/aspire/s5/local/chain/run_tdnn.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_7b.sh -------------------------------------------------------------------------------- /egs/babel/s5/conf/plp.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | -------------------------------------------------------------------------------- 
/egs/babel/s5b/conf/pitch.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | -------------------------------------------------------------------------------- /egs/babel/s5b/conf/plp.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | -------------------------------------------------------------------------------- /egs/babel/s5c/conf/pitch.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | -------------------------------------------------------------------------------- /egs/babel/s5c/conf/plp.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | -------------------------------------------------------------------------------- /egs/babel/s5d/conf/pitch.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | -------------------------------------------------------------------------------- /egs/babel/s5d/conf/plp.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | -------------------------------------------------------------------------------- /egs/csj/s5/conf/pitch.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=16000 2 | -------------------------------------------------------------------------------- /egs/fisher_callhome_spanish/s5/steps: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/steps -------------------------------------------------------------------------------- /egs/fisher_callhome_spanish/s5/utils: -------------------------------------------------------------------------------- 1 | ../../wsj/s5/utils 
-------------------------------------------------------------------------------- /egs/hkust/s5/conf/pitch.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | -------------------------------------------------------------------------------- /egs/swbd/s5b/conf/pitch.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | -------------------------------------------------------------------------------- /egs/swbd/s5c/conf/pitch.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | -------------------------------------------------------------------------------- /egs/swbd/s5c/local/chain/run_lstm.sh: -------------------------------------------------------------------------------- 1 | tuning/run_lstm_6j.sh -------------------------------------------------------------------------------- /egs/swbd/s5c/local/chain/run_tdnn.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_7k.sh -------------------------------------------------------------------------------- /egs/swbd/s5c/local/nnet3/run_tdnn.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_d.sh -------------------------------------------------------------------------------- /egs/vystadial_en/online_demo: -------------------------------------------------------------------------------- 1 | ../vystadial_cz/online_demo/ -------------------------------------------------------------------------------- /egs/wsj/s5/local/chain/run_tdnn.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_1b.sh -------------------------------------------------------------------------------- /egs/wsj/s5/local/nnet3/run_tdnn.sh: 
-------------------------------------------------------------------------------- 1 | tuning/run_tdnn_1a.sh -------------------------------------------------------------------------------- /egs/wsj/s5/steps/score_kaldi.sh: -------------------------------------------------------------------------------- 1 | scoring/score_kaldi_wer.sh -------------------------------------------------------------------------------- /egs/wsj/s5/utils/data/combine_data.sh: -------------------------------------------------------------------------------- 1 | ../combine_data.sh -------------------------------------------------------------------------------- /egs/wsj/s5/utils/data/copy_data_dir.sh: -------------------------------------------------------------------------------- 1 | ../copy_data_dir.sh -------------------------------------------------------------------------------- /egs/wsj/s5/utils/data/fix_data_dir.sh: -------------------------------------------------------------------------------- 1 | ../fix_data_dir.sh -------------------------------------------------------------------------------- /egs/wsj/s5/utils/lang/prepare_lang.sh: -------------------------------------------------------------------------------- 1 | ../prepare_lang.sh -------------------------------------------------------------------------------- /egs/wsj/s5/utils/lang/validate_lang.pl: -------------------------------------------------------------------------------- 1 | ../validate_lang.pl -------------------------------------------------------------------------------- /egs/yesno/s5/input/lexicon_nosil.txt: -------------------------------------------------------------------------------- 1 | YES Y 2 | NO N 3 | -------------------------------------------------------------------------------- /tools/install_pfile_utils.sh: -------------------------------------------------------------------------------- 1 | extras/install_pfile_utils.sh -------------------------------------------------------------------------------- 
/egs/ami/s5b/local/split_dev.orig: -------------------------------------------------------------------------------- 1 | ../../s5/local/split_dev.orig -------------------------------------------------------------------------------- /egs/ami/s5b/local/split_eval.orig: -------------------------------------------------------------------------------- 1 | ../../s5/local/split_eval.orig -------------------------------------------------------------------------------- /egs/aspire/s5/local/chain/run_blstm.sh: -------------------------------------------------------------------------------- 1 | tuning/run_blstm_7b.sh -------------------------------------------------------------------------------- /egs/gale_arabic/s5/conf/decode.config: -------------------------------------------------------------------------------- 1 | link decode_dnn.config -------------------------------------------------------------------------------- /egs/gale_arabic/s5b/conf/decode.config: -------------------------------------------------------------------------------- 1 | link decode_dnn.config -------------------------------------------------------------------------------- /egs/hkust/s5/conf/online_pitch.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | -------------------------------------------------------------------------------- /egs/sprakbanken/s5/local/chain/run_lstm.sh: -------------------------------------------------------------------------------- 1 | tuning/run_lstm_1e.sh -------------------------------------------------------------------------------- /egs/sprakbanken/s5/local/chain/run_tdnn.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_1b.sh -------------------------------------------------------------------------------- /egs/sprakbanken/s5/local/dictsrc/silence_phones.txt: -------------------------------------------------------------------------------- 1 | SIL 2 | 
-------------------------------------------------------------------------------- /egs/swbd/s5c/local/chain/run_blstm.sh: -------------------------------------------------------------------------------- 1 | tuning/run_blstm_6k.sh -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/local/chain/run_tdnn.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_1e.sh -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/local/nnet3/run_lstm.sh: -------------------------------------------------------------------------------- 1 | tuning/run_lstm_1a.sh -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/local/nnet3/run_tdnn.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_1b.sh -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/local/dict: -------------------------------------------------------------------------------- 1 | ../../../wsj/s5/local/dict/ -------------------------------------------------------------------------------- /egs/wsj/s5/utils/data/subset_data_dir.sh: -------------------------------------------------------------------------------- 1 | ../subset_data_dir.sh -------------------------------------------------------------------------------- /egs/wsj/s5/utils/lang/add_lex_disambig.pl: -------------------------------------------------------------------------------- 1 | ../add_lex_disambig.pl -------------------------------------------------------------------------------- /egs/yesno/s5/input/lexicon.txt: -------------------------------------------------------------------------------- 1 | SIL 2 | YES Y 3 | NO N 4 | -------------------------------------------------------------------------------- /egs/ami/s5b/local/chain/run_tdnn_lstm.sh: 
-------------------------------------------------------------------------------- 1 | tuning/run_tdnn_lstm_1j.sh -------------------------------------------------------------------------------- /egs/ami/s5b/local/split_train.orig: -------------------------------------------------------------------------------- 1 | ../../s5/local/split_train.orig -------------------------------------------------------------------------------- /egs/babel/s5b/local/datasets/unsupervised_seg.sh: -------------------------------------------------------------------------------- 1 | supervised_seg.sh -------------------------------------------------------------------------------- /egs/babel/s5b/local/datasets/unsupervised_uem.sh: -------------------------------------------------------------------------------- 1 | supervised_uem.sh -------------------------------------------------------------------------------- /egs/babel/s5c/local/datasets/unsupervised_seg.sh: -------------------------------------------------------------------------------- 1 | supervised_seg.sh -------------------------------------------------------------------------------- /egs/babel/s5c/local/datasets/unsupervised_uem.sh: -------------------------------------------------------------------------------- 1 | supervised_uem.sh -------------------------------------------------------------------------------- /egs/babel/s5d/local/datasets/unsupervised_seg.sh: -------------------------------------------------------------------------------- 1 | supervised_seg.sh -------------------------------------------------------------------------------- /egs/babel/s5d/local/datasets/unsupervised_uem.sh: -------------------------------------------------------------------------------- 1 | supervised_uem.sh -------------------------------------------------------------------------------- /egs/babel_multilang/s5/conf/plp.conf: -------------------------------------------------------------------------------- 1 | ../../../babel/s5d/conf/plp.conf 
-------------------------------------------------------------------------------- /egs/fame/s5/local/wer_hyp_filter: -------------------------------------------------------------------------------- 1 | #!/bin/sed -f 2 | s:::g 3 | -------------------------------------------------------------------------------- /egs/fame/s5/local/wer_output_filter: -------------------------------------------------------------------------------- 1 | #!/bin/sed -f 2 | s:::g 3 | -------------------------------------------------------------------------------- /egs/fame/s5/local/wer_ref_filter: -------------------------------------------------------------------------------- 1 | #!/bin/sed -f 2 | s:::g 3 | -------------------------------------------------------------------------------- /egs/gale_arabic/s5b/local/chain/run_tdnn.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_1a.sh -------------------------------------------------------------------------------- /egs/gale_arabic/s5b/local/nnet3/run_lstm.sh: -------------------------------------------------------------------------------- 1 | tuning/run_lstm_1a.sh -------------------------------------------------------------------------------- /egs/gale_arabic/s5b/local/nnet3/run_tdnn.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_1a.sh -------------------------------------------------------------------------------- /egs/gale_mandarin/s5/conf/pitch.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=16000 2 | -------------------------------------------------------------------------------- /egs/mini_librispeech/s5/local/chain/run_tdnn.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_1c.sh -------------------------------------------------------------------------------- /egs/reverb/s5/local/flist2scp.pl: 
-------------------------------------------------------------------------------- 1 | ../../../wsj/s5/local/flist2scp.pl -------------------------------------------------------------------------------- /egs/reverb/s5/local/score_mbr.sh: -------------------------------------------------------------------------------- 1 | ../../../wsj/s5/local/score_mbr.sh -------------------------------------------------------------------------------- /egs/rm/s5/conf/plp.conf: -------------------------------------------------------------------------------- 1 | # No non-default options for now. 2 | 3 | -------------------------------------------------------------------------------- /egs/sprakbanken_swe/s5/local/dictsrc/optional_silence.txt: -------------------------------------------------------------------------------- 1 | SIL 2 | -------------------------------------------------------------------------------- /egs/swbd/s5c/local/chain/run_tdnn_lstm.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_lstm_1e.sh -------------------------------------------------------------------------------- /egs/swbd/s5c/local/nnet3/run_tdnn_disc.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_d_disc.sh -------------------------------------------------------------------------------- /egs/swbd/s5c/local/nnet3/run_tdnn_lfr.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_lfr1c.sh -------------------------------------------------------------------------------- /egs/wsj/s5/local/chain/run_tdnn_lstm.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_lstm_1a.sh -------------------------------------------------------------------------------- /egs/wsj/s5/local/nnet3/run_tdnn_lstm.sh: -------------------------------------------------------------------------------- 1 | 
tuning/run_tdnn_lstm_1a.sh -------------------------------------------------------------------------------- /egs/wsj/s5/utils/data/validate_data_dir.sh: -------------------------------------------------------------------------------- 1 | ../validate_data_dir.sh -------------------------------------------------------------------------------- /src/lm/examples/YEARDATE.txt: -------------------------------------------------------------------------------- 1 | %#MONTH#% %#DAYOFMONTH#% %#YEAR#% 2 | -------------------------------------------------------------------------------- /src/lm/examples/input4.txt: -------------------------------------------------------------------------------- 1 | He came here on %#YEARDATE#% 2 | -------------------------------------------------------------------------------- /egs/babel_multilang/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | ../../../babel/s5d/conf/mfcc.conf -------------------------------------------------------------------------------- /egs/babel_multilang/s5/conf/pitch.conf: -------------------------------------------------------------------------------- 1 | ../../../babel/s5d/conf/pitch.conf -------------------------------------------------------------------------------- /egs/fame/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | # No non-default options for now. 
2 | 3 | -------------------------------------------------------------------------------- /egs/gale_mandarin/s5/local/score.sh: -------------------------------------------------------------------------------- 1 | ../steps/scoring/score_kaldi_cer.sh -------------------------------------------------------------------------------- /egs/lre07/v1/lid/nnet2/relabel_egs2.sh: -------------------------------------------------------------------------------- 1 | ../../steps/nnet2/relabel_egs2.sh -------------------------------------------------------------------------------- /egs/reverb/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | # No non-default options for now. 2 | 3 | -------------------------------------------------------------------------------- /egs/sprakbanken/s5/local/chain/run_tdnn_lstm.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_lstm_1a.sh -------------------------------------------------------------------------------- /egs/sprakbanken_swe/s5/local/dictsrc/silence_phones.txt: -------------------------------------------------------------------------------- 1 | SIL 2 | SPN 3 | -------------------------------------------------------------------------------- /egs/swbd/s5c/local/chain/run_tdnn_blstm.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_blstm_1a.sh -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/local/chain/run_tdnn_lstm.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_lstm_1e.sh -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/local/nnet3/run_tdnn_lstm.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_lstm_1a.sh 
-------------------------------------------------------------------------------- /egs/wsj/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | # No non-default options for now. 2 | 3 | -------------------------------------------------------------------------------- /egs/wsj/s5/local/nnet3/run_tdnn_lstm_lfr.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_lstm_lfr_1a.sh -------------------------------------------------------------------------------- /egs/wsj/s5/steps/score_kaldi_compare.sh: -------------------------------------------------------------------------------- 1 | scoring/score_kaldi_compare.sh -------------------------------------------------------------------------------- /egs/an4/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false 2 | --sample-frequency=16000 3 | -------------------------------------------------------------------------------- /egs/babel_multilang/s5/conf/common.fullLP: -------------------------------------------------------------------------------- 1 | ../../../babel/s5d/conf/common.fullLP -------------------------------------------------------------------------------- /egs/babel_multilang/s5/local/score_stm.sh: -------------------------------------------------------------------------------- 1 | ../../../babel/s5d/local/score_stm.sh -------------------------------------------------------------------------------- /egs/fame/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 
2 | -------------------------------------------------------------------------------- /egs/gale_arabic/s5b/local/chain/run_tdnn_lstm.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_lstm_1a.sh -------------------------------------------------------------------------------- /egs/gp/s1/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | -------------------------------------------------------------------------------- /egs/gp/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | -------------------------------------------------------------------------------- /egs/iban/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | -------------------------------------------------------------------------------- /egs/mini_librispeech/s5/local/nnet3/run_tdnn_lstm.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_lstm_1b.sh -------------------------------------------------------------------------------- /egs/rm/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | -------------------------------------------------------------------------------- /egs/sprakbanken/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | # No non-default options for now. 
2 | 3 | -------------------------------------------------------------------------------- /egs/swbd/s5c/local/nnet3/run_tdnn_lfr_disc.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_lfr1c_disc.sh -------------------------------------------------------------------------------- /egs/tedlium/s5/conf/decode.config: -------------------------------------------------------------------------------- 1 | # empty config, just use the defaults. 2 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/local/download_data.sh: -------------------------------------------------------------------------------- 1 | ../../s5_r2/local/download_data.sh -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/local/flist2scp.pl: -------------------------------------------------------------------------------- 1 | ../../../wsj/s5/local/flist2scp.pl -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/local/join_suffix.py: -------------------------------------------------------------------------------- 1 | ../../s5_r2/local/join_suffix.py -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/local/ndx2flist.pl: -------------------------------------------------------------------------------- 1 | ../../../wsj/s5/local/ndx2flist.pl -------------------------------------------------------------------------------- /egs/wsj/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 
2 | -------------------------------------------------------------------------------- /egs/wsj/s5/local/nnet3/run_tdnn_lstm_disc.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_lstm_1a_disc.sh -------------------------------------------------------------------------------- /egs/wsj/s5/steps/nnet2/get_num_frames.sh: -------------------------------------------------------------------------------- 1 | ../../utils/data/get_num_frames.sh -------------------------------------------------------------------------------- /egs/wsj/s5/utils/data/perturb_data_dir_speed.sh: -------------------------------------------------------------------------------- 1 | ../perturb_data_dir_speed.sh -------------------------------------------------------------------------------- /src/lm/examples/MONTH.txt: -------------------------------------------------------------------------------- 1 | January 2 | February 3 | March 4 | April 5 | May 6 | -------------------------------------------------------------------------------- /src/lm/examples/input3.txt: -------------------------------------------------------------------------------- 1 | the %#CREATURE#% crossed the street 2 | -------------------------------------------------------------------------------- /egs/ami/s5b/local/chain/multi_condition/run_tdnn_lstm.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_lstm_1a.sh -------------------------------------------------------------------------------- /egs/aspire/s5/conf/pitch.conf: -------------------------------------------------------------------------------- 1 | --snip-edges=false 2 | --sample-frequency=8000 3 | -------------------------------------------------------------------------------- /egs/aurora4/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 
2 | -------------------------------------------------------------------------------- /egs/babel_multilang/s5/conf/common_vars.sh: -------------------------------------------------------------------------------- 1 | ../../../babel/s5d/conf/common_vars.sh -------------------------------------------------------------------------------- /egs/babel_multilang/s5/conf/mfcc_hires.conf: -------------------------------------------------------------------------------- 1 | ../../../babel/s5d/conf/mfcc_hires.conf -------------------------------------------------------------------------------- /egs/babel_multilang/s5/local/kws_search.sh: -------------------------------------------------------------------------------- 1 | ../../../babel/s5d/local/kws_search.sh -------------------------------------------------------------------------------- /egs/callhome_egyptian/s5/conf/plp.conf: -------------------------------------------------------------------------------- 1 | # No non-default options for now. 2 | 3 | -------------------------------------------------------------------------------- /egs/chime2/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | -------------------------------------------------------------------------------- /egs/chime3/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | -------------------------------------------------------------------------------- /egs/farsdat/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | -------------------------------------------------------------------------------- /egs/librispeech/s5/conf/decode.config: -------------------------------------------------------------------------------- 1 | # empty config, just use the defaults. 
2 | -------------------------------------------------------------------------------- /egs/reverb/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | -------------------------------------------------------------------------------- /egs/sprakbanken_swe/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | # No non-default options for now. 2 | 3 | -------------------------------------------------------------------------------- /egs/tedlium/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false 2 | --sample-frequency=16000 3 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/conf/decode.config: -------------------------------------------------------------------------------- 1 | # empty config, just use the defaults. 2 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/local/chain/run_tdnn_lstm_disc.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_lstm_1e_disc.sh -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/local/nnet3/run_tdnn_lstm_disc.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_lstm_1a_disc.sh -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/local/nnet3/run_tdnn_lstm_lfr.sh: -------------------------------------------------------------------------------- 1 | tuning/run_tdnn_lstm_lfr_1a.sh -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/conf/decode.config: -------------------------------------------------------------------------------- 1 | # empty config, just use the defaults. 
2 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/local/run_segmentation_wsj.sh: -------------------------------------------------------------------------------- 1 | tuning/run_segmentation_wsj_e.sh -------------------------------------------------------------------------------- /egs/tidigits/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false 2 | --sample-frequency=20000 3 | -------------------------------------------------------------------------------- /egs/timit/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | -------------------------------------------------------------------------------- /egs/voxforge/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | -------------------------------------------------------------------------------- /src/lm/examples/DAYOFMONTH.txt: -------------------------------------------------------------------------------- 1 | first 2 | second 3 | third 4 | fourth 5 | fifth 6 | -------------------------------------------------------------------------------- /egs/an4/s5/conf/decode.config: -------------------------------------------------------------------------------- 1 | first_beam=16.0 2 | beam=20.0 3 | lattice_beam=10.0 4 | -------------------------------------------------------------------------------- /egs/babel_multilang/s5/conf/common.limitedLP: -------------------------------------------------------------------------------- 1 | ../../../babel/s5d/conf/common.limitedLP -------------------------------------------------------------------------------- /egs/babel_multilang/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | 
../../../babel/s5d/conf/online_cmvn.conf -------------------------------------------------------------------------------- /egs/babel_multilang/s5/local/lattice_to_ctm.sh: -------------------------------------------------------------------------------- 1 | ../../../babel/s5d/local/lattice_to_ctm.sh -------------------------------------------------------------------------------- /egs/chime4/s5_1ch/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | -------------------------------------------------------------------------------- /egs/chime4/s5_2ch/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | -------------------------------------------------------------------------------- /egs/chime4/s5_6ch/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | -------------------------------------------------------------------------------- /egs/fisher_callhome_spanish/s5/conf/plp.conf: -------------------------------------------------------------------------------- 1 | # No non-default options for now. 2 | 3 | -------------------------------------------------------------------------------- /egs/gale_arabic/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | -------------------------------------------------------------------------------- /egs/gale_arabic/s5b/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 
2 | -------------------------------------------------------------------------------- /egs/gale_mandarin/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | -------------------------------------------------------------------------------- /egs/librispeech/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | -------------------------------------------------------------------------------- /egs/lre/v1/conf/vad.conf: -------------------------------------------------------------------------------- 1 | --vad-energy-threshold=5.5 2 | --vad-energy-mean-scale=0.5 3 | -------------------------------------------------------------------------------- /egs/mini_librispeech/s5/local/data_prep.sh: -------------------------------------------------------------------------------- 1 | ../../../librispeech/s5/local/data_prep.sh -------------------------------------------------------------------------------- /egs/mini_librispeech/s5/local/format_lms.sh: -------------------------------------------------------------------------------- 1 | ../../../librispeech/s5/local/format_lms.sh -------------------------------------------------------------------------------- /egs/reverb/s5/local/normalize_transcript.pl: -------------------------------------------------------------------------------- 1 | ../../../wsj/s5/local/normalize_transcript.pl -------------------------------------------------------------------------------- /egs/sprakbanken/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 
2 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false 2 | --sample-frequency=16000 3 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false 2 | --sample-frequency=16000 3 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/local/find_transcripts.pl: -------------------------------------------------------------------------------- 1 | ../../../wsj/s5/local/find_transcripts.pl -------------------------------------------------------------------------------- /windows/.gitignore: -------------------------------------------------------------------------------- 1 | variables.props 2 | kaldiwin.props 3 | kaldiwin_projguids.txt 4 | -------------------------------------------------------------------------------- /egs/lre07/v1/conf/vad.conf: -------------------------------------------------------------------------------- 1 | --vad-energy-threshold=5.5 2 | --vad-energy-mean-scale=0.5 3 | -------------------------------------------------------------------------------- /egs/lre07/v2/conf/vad.conf: -------------------------------------------------------------------------------- 1 | --vad-energy-threshold=5.5 2 | --vad-energy-mean-scale=0.5 3 | -------------------------------------------------------------------------------- /egs/mini_librispeech/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 
2 | -------------------------------------------------------------------------------- /egs/mini_librispeech/s5/local/prepare_dict.sh: -------------------------------------------------------------------------------- 1 | ../../../librispeech/s5/local/prepare_dict.sh -------------------------------------------------------------------------------- /egs/multi_en/s5/conf/decode.config: -------------------------------------------------------------------------------- 1 | first_beam=16.0 2 | beam=20.0 3 | lattice_beam=10.0 4 | -------------------------------------------------------------------------------- /egs/rm/s5/conf/pitch.conf: -------------------------------------------------------------------------------- 1 | --nccf-ballast-online=true # helps for online operation. 2 | 3 | -------------------------------------------------------------------------------- /egs/sprakbanken_swe/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 
2 | -------------------------------------------------------------------------------- /egs/sre08/v1/conf/vad.conf: -------------------------------------------------------------------------------- 1 | --vad-energy-threshold=5.5 2 | --vad-energy-mean-scale=0.5 3 | -------------------------------------------------------------------------------- /egs/sre10/v1/conf/vad.conf: -------------------------------------------------------------------------------- 1 | --vad-energy-threshold=5.5 2 | --vad-energy-mean-scale=0.5 3 | -------------------------------------------------------------------------------- /egs/sre10/v2/conf/vad.conf: -------------------------------------------------------------------------------- 1 | --vad-energy-threshold=5.5 2 | --vad-energy-mean-scale=0.5 3 | -------------------------------------------------------------------------------- /egs/voxforge/s5/conf/decode.config: -------------------------------------------------------------------------------- 1 | first_beam=10.0 2 | beam=13.0 3 | lattice_beam=6.0 4 | -------------------------------------------------------------------------------- /egs/vystadial_cz/s5/common/decode.conf: -------------------------------------------------------------------------------- 1 | beam=12.0 2 | latbeam=6.0 3 | max_active=14000 4 | -------------------------------------------------------------------------------- /egs/vystadial_en/s5/common/decode.conf: -------------------------------------------------------------------------------- 1 | beam=12.0 2 | latbeam=6.0 3 | max_active=14000 4 | -------------------------------------------------------------------------------- /Kaldi_Pi.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/Kaldi_Pi.png -------------------------------------------------------------------------------- /egs/lre07/v2/local/lre07_eval/score_lre07.v01d.pl: 
-------------------------------------------------------------------------------- 1 | ../../../v1/local/lre07_eval/score_lre07.v01d.pl -------------------------------------------------------------------------------- /egs/tedlium/s5/conf/pitch.conf: -------------------------------------------------------------------------------- 1 | --nccf-ballast-online=true # helps for online operation. 2 | 3 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/local/normalize_transcript.pl: -------------------------------------------------------------------------------- 1 | ../../../wsj/s5/local/normalize_transcript.pl -------------------------------------------------------------------------------- /egs/babel_multilang/s5/local/datasets/extra_kws.sh: -------------------------------------------------------------------------------- 1 | ../../../../babel/s5d/local/datasets/extra_kws.sh -------------------------------------------------------------------------------- /egs/babel_multilang/s5/local/datasets/vocab_kws.sh: -------------------------------------------------------------------------------- 1 | ../../../../babel/s5d/local/datasets/vocab_kws.sh -------------------------------------------------------------------------------- /egs/bn_music_speech/v1/conf/vad.conf: -------------------------------------------------------------------------------- 1 | --vad-energy-threshold=5.5 2 | --vad-energy-mean-scale=0.5 3 | -------------------------------------------------------------------------------- /egs/gale_arabic/s5/conf/pitch.conf: -------------------------------------------------------------------------------- 1 | --nccf-ballast-online=true # helps for online operation. 2 | 3 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/conf/pitch.conf: -------------------------------------------------------------------------------- 1 | --nccf-ballast-online=true # helps for online operation. 
2 | 3 | -------------------------------------------------------------------------------- /egs/timit/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | --htk-compat=true 2 | --window-type=hamming 3 | --num-mel-bins=23 4 | 5 | -------------------------------------------------------------------------------- /egs/ami/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | --sample-frequency=16000 3 | -------------------------------------------------------------------------------- /egs/ami/s5b/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | --sample-frequency=16000 3 | -------------------------------------------------------------------------------- /egs/farsdat/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | --htk-compat=true 2 | --window-type=hamming 3 | --num-mel-bins=23 4 | 5 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/conf/pitch.conf: -------------------------------------------------------------------------------- 1 | --nccf-ballast-online=true # helps for online operation. 
2 | 3 | -------------------------------------------------------------------------------- /src/doc/Kaldi.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/src/doc/Kaldi.pptx -------------------------------------------------------------------------------- /egs/babel_multilang/s5/local/datasets/supervised_pem.sh: -------------------------------------------------------------------------------- 1 | ../../../../babel/s5d/local/datasets/supervised_pem.sh -------------------------------------------------------------------------------- /egs/babel_multilang/s5/local/datasets/unsupervised_seg.sh: -------------------------------------------------------------------------------- 1 | ../../../../babel/s5d/local/datasets/unsupervised_seg.sh -------------------------------------------------------------------------------- /egs/babel_multilang/s5/local/datasets/unsupervised_uem.sh: -------------------------------------------------------------------------------- 1 | ../../../../babel/s5d/local/datasets/unsupervised_uem.sh -------------------------------------------------------------------------------- /egs/thchs30/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 
2 | #--sample-frequency=8000 3 | -------------------------------------------------------------------------------- /egs/vystadial_cz/online_demo/__init__.py: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env python 2 | from __future__ import unicode_literals 3 | -------------------------------------------------------------------------------- /egs/ami/s5/conf/decode_tandem.conf: -------------------------------------------------------------------------------- 1 | beam=16.0 2 | lattice_beam=8.0 3 | scoring_opts="--min-lmwt 20 --max-lmwt 30" 4 | -------------------------------------------------------------------------------- /egs/csj/s5/conf/decode_tandem.config: -------------------------------------------------------------------------------- 1 | beam=16.0 2 | lattice_beam=8.0 3 | scoring_opts="--min-lmwt 20 --max-lmwt 30" 4 | -------------------------------------------------------------------------------- /misc/logo/KaldiIco.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/misc/logo/KaldiIco.png -------------------------------------------------------------------------------- /misc/logo/KaldiLogo.docx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/misc/logo/KaldiLogo.docx -------------------------------------------------------------------------------- /misc/logo/KaldiLogo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/misc/logo/KaldiLogo.png -------------------------------------------------------------------------------- /src/doc/KaldiMatrix.pptx: -------------------------------------------------------------------------------- 
https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/src/doc/KaldiMatrix.pptx -------------------------------------------------------------------------------- /src/doc/KaldiModels.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/src/doc/KaldiModels.pptx -------------------------------------------------------------------------------- /windows/NewGuidCmd.exe: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/windows/NewGuidCmd.exe -------------------------------------------------------------------------------- /egs/callhome_egyptian/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | --sample-frequency=8000 3 | -------------------------------------------------------------------------------- /egs/gale_arabic/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | # No non-default options for now. 
2 | --sample-frequency=16000 3 | --num-mel-bins=30 4 | -------------------------------------------------------------------------------- /egs/multi_en/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false 2 | --sample-frequency=8000 3 | --low-freq=20 4 | --high-freq=3700 5 | -------------------------------------------------------------------------------- /egs/swbd/s5b/conf/decode_tandem.config: -------------------------------------------------------------------------------- 1 | beam=16.0 2 | lattice_beam=8.0 3 | scoring_opts="--min-lmwt 20 --max-lmwt 30" 4 | -------------------------------------------------------------------------------- /egs/swbd/s5c/conf/decode_tandem.config: -------------------------------------------------------------------------------- 1 | beam=16.0 2 | lattice_beam=8.0 3 | scoring_opts="--min-lmwt 20 --max-lmwt 30" 4 | -------------------------------------------------------------------------------- /egs/thchs30/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | # No non-default options for now. 
2 | #--sample-frequency=8000 3 | --num-mel-bins=40 4 | -------------------------------------------------------------------------------- /src/doc/KaldiScripts.pptx: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/src/doc/KaldiScripts.pptx -------------------------------------------------------------------------------- /src/lm/examples/YEAR.txt: -------------------------------------------------------------------------------- 1 | two thousand and ten 2 | two zero one zero 3 | two thousand and nine 4 | two zero zero nine 5 | -------------------------------------------------------------------------------- /egs/ami/s5/local/english.glm: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/egs/ami/s5/local/english.glm -------------------------------------------------------------------------------- /egs/fisher_callhome_spanish/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | --sample-frequency=8000 3 | -------------------------------------------------------------------------------- /egs/gale_mandarin/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | # Filterbank options; --num-mel-bins below is the only non-default value.
2 | --sample-frequency=16000 3 | --num-mel-bins=30 4 | -------------------------------------------------------------------------------- /src/feat/test_data/test.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/src/feat/test_data/test.wav -------------------------------------------------------------------------------- /src/onlinebin/java-online-audio-client/MANIFEST.MF: -------------------------------------------------------------------------------- 1 | Manifest-Version: 1.0 2 | Class-Path: . 3 | Main-Class: Main 4 | 5 | -------------------------------------------------------------------------------- /egs/ami/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /egs/ami/s5b/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /egs/chime1/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | --sample-frequency=16000 # sampled at 16kHz 3 | -------------------------------------------------------------------------------- /egs/csj/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 
2 | --sample-frequency=16000 # CSJ is sampled at 16kHz 3 | -------------------------------------------------------------------------------- /egs/hkust/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /egs/iban/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /egs/lre/v1/conf/logistic-regression.conf: -------------------------------------------------------------------------------- 1 | --max-steps=20 2 | --normalizer=0.00025 3 | --verbose=3 4 | --power=0.15 5 | --mix-up=90 6 | -------------------------------------------------------------------------------- /egs/rm/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /egs/swbd/s5b/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /egs/swbd/s5c/conf/decode_online.config: -------------------------------------------------------------------------------- 1 | beam=11.0 # beam for decoding. 2 | first_beam=8.0 # beam for 1st-pass decoding in SAT. 
3 | -------------------------------------------------------------------------------- /egs/swbd/s5c/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /misc/logo/KaldiTextAndLogo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/misc/logo/KaldiTextAndLogo.png -------------------------------------------------------------------------------- /egs/aspire/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /egs/aurora4/s5/local/run_nnet_cpu.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | . ./cmd.sh 4 | 5 | 6 | # ... 7 | 8 | local/nnet2/run_5c.sh 9 | 10 | -------------------------------------------------------------------------------- /egs/babel/s5d/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /egs/iban/s5/conf/decode.config: -------------------------------------------------------------------------------- 1 | # Use wider-than-normal decoding beams for Iban (same values as the RM recipe).
2 | first_beam=16.0 3 | beam=20.0 4 | lattice_beam=10.0 5 | -------------------------------------------------------------------------------- /egs/lre07/v1/conf/logistic-regression.conf: -------------------------------------------------------------------------------- 1 | --max-steps=35 2 | --normalizer=0.001 3 | --verbose=3 4 | --power=0.15 5 | --mix-up=150 6 | -------------------------------------------------------------------------------- /egs/lre07/v2/conf/logistic-regression.conf: -------------------------------------------------------------------------------- 1 | --max-steps=35 2 | --normalizer=0.001 3 | --verbose=3 4 | --power=0.15 5 | --mix-up=150 6 | -------------------------------------------------------------------------------- /egs/multi_en/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /egs/rm/s5/conf/decode.config: -------------------------------------------------------------------------------- 1 | # Use wider-than-normal decoding beams for RM. 
2 | first_beam=16.0 3 | beam=20.0 4 | lattice_beam=10.0 5 | -------------------------------------------------------------------------------- /egs/tedlium/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /egs/aspire/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | --sample-frequency=8000 # Switchboard is sampled at 8kHz 3 | -------------------------------------------------------------------------------- /egs/babel/s5d/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 
2 | --sample-frequency=8000 # Switchboard is sampled at 8kHz 3 | -------------------------------------------------------------------------------- /egs/fisher_english/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /egs/fisher_swbd/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /egs/gp/s5/local/gp_norm_trans_CZ.pl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/egs/gp/s5/local/gp_norm_trans_CZ.pl -------------------------------------------------------------------------------- /egs/hkust/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 
2 | --sample-frequency=8000 # HKUST is sampled at 8kHz 3 | -------------------------------------------------------------------------------- /egs/librispeech/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /egs/sprakbanken/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /egs/swbd/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | --sample-frequency=8000 # Switchboard is sampled at 8kHz 3 | -------------------------------------------------------------------------------- /egs/swbd/s5b/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | --sample-frequency=8000 # Switchboard is sampled at 8kHz 3 | -------------------------------------------------------------------------------- /egs/swbd/s5c/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option.
2 | --sample-frequency=8000 # Switchboard is sampled at 8kHz 3 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /egs/yesno/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | --sample-frequency=8000 # the yesno data is sampled at 8kHz 3 | -------------------------------------------------------------------------------- /misc/logo/KaldiTextAndLogoSmall.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/misc/logo/KaldiTextAndLogoSmall.png -------------------------------------------------------------------------------- /egs/csj/s5/conf/decode.config: -------------------------------------------------------------------------------- 1 | beam=11.0 # beam for decoding. Was 13.0 in the scripts. 2 | first_beam=8.0 # beam for 1st-pass decoding in SAT.
3 | -------------------------------------------------------------------------------- /egs/csj/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/online/run_online_decoding_nnet2.sh 2 | -------------------------------------------------------------------------------- /egs/fame/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/online/run_online_decoding_nnet2.sh 2 | -------------------------------------------------------------------------------- /egs/fisher_swbd/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | --sample-frequency=8000 # Switchboard is sampled at 8kHz 3 | -------------------------------------------------------------------------------- /egs/mini_librispeech/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/run_online_decoding.sh 2 | -------------------------------------------------------------------------------- /egs/swbd/s5/conf/decode.config: -------------------------------------------------------------------------------- 1 | beam=11.0 # beam for decoding. Was 13.0 in the scripts. 2 | first_beam=8.0 # beam for 1st-pass decoding in SAT. 3 | -------------------------------------------------------------------------------- /egs/swbd/s5b/conf/decode.config: -------------------------------------------------------------------------------- 1 | beam=11.0 # beam for decoding. Was 13.0 in the scripts. 2 | first_beam=8.0 # beam for 1st-pass decoding in SAT. 
3 | -------------------------------------------------------------------------------- /egs/swbd/s5c/conf/decode.config: -------------------------------------------------------------------------------- 1 | beam=11.0 # beam for decoding. Was 13.0 in the scripts. 2 | first_beam=8.0 # beam for 1st-pass decoding in SAT. 3 | -------------------------------------------------------------------------------- /egs/wsj/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/online/run_online_decoding_nnet2.sh 2 | -------------------------------------------------------------------------------- /src/feat/test_data/test.wav.fbank_htk.1: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/src/feat/test_data/test.wav.fbank_htk.1 -------------------------------------------------------------------------------- /src/feat/test_data/test.wav.fbank_htk.2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/src/feat/test_data/test.wav.fbank_htk.2 -------------------------------------------------------------------------------- /src/feat/test_data/test.wav.fbank_htk.3: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/src/feat/test_data/test.wav.fbank_htk.3 -------------------------------------------------------------------------------- /src/feat/test_data/test.wav.fbank_htk.4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/src/feat/test_data/test.wav.fbank_htk.4 -------------------------------------------------------------------------------- 
/src/feat/test_data/test.wav.fea_htk.1: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/src/feat/test_data/test.wav.fea_htk.1 -------------------------------------------------------------------------------- /src/feat/test_data/test.wav.fea_htk.2: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/src/feat/test_data/test.wav.fea_htk.2 -------------------------------------------------------------------------------- /src/feat/test_data/test.wav.fea_htk.3: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/src/feat/test_data/test.wav.fea_htk.3 -------------------------------------------------------------------------------- /src/feat/test_data/test.wav.fea_htk.4: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/src/feat/test_data/test.wav.fea_htk.4 -------------------------------------------------------------------------------- /src/feat/test_data/test.wav.fea_htk.5: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/src/feat/test_data/test.wav.fea_htk.5 -------------------------------------------------------------------------------- /src/feat/test_data/test.wav.fea_htk.6: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/src/feat/test_data/test.wav.fea_htk.6 -------------------------------------------------------------------------------- /src/feat/test_data/test.wav.plp_htk.1: 
-------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/src/feat/test_data/test.wav.plp_htk.1 -------------------------------------------------------------------------------- /egs/ami/s5/conf/decode.conf: -------------------------------------------------------------------------------- 1 | beam=11.0 # beam for decoding. Was 13.0 in the scripts. 2 | first_beam=8.0 # beam for 1st-pass decoding in SAT. 3 | 4 | -------------------------------------------------------------------------------- /egs/ami/s5b/conf/decode.conf: -------------------------------------------------------------------------------- 1 | beam=11.0 # beam for decoding. Was 13.0 in the scripts. 2 | first_beam=8.0 # beam for 1st-pass decoding in SAT. 3 | 4 | -------------------------------------------------------------------------------- /egs/fisher_english/s5/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 
2 | --sample-frequency=8000 # Switchboard is sampled at 8kHz 3 | -------------------------------------------------------------------------------- /egs/gale_arabic/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/online/run_online_decoding_nnet2.sh 2 | -------------------------------------------------------------------------------- /egs/gale_arabic/s5b/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/online/run_online_decoding_nnet2.sh 2 | -------------------------------------------------------------------------------- /egs/yesno/s5/input/task.arpabo: -------------------------------------------------------------------------------- 1 | 2 | \data\ 3 | ngram 1=4 4 | 5 | \1-grams: 6 | -1 NO 7 | -1 YES 8 | -99 9 | -1 10 | 11 | \end\ 12 | -------------------------------------------------------------------------------- /misc/papers/asru11_toolkit/kaldi_asru.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/misc/papers/asru11_toolkit/kaldi_asru.pdf -------------------------------------------------------------------------------- /egs/aspire/s5/conf/voiced_feat.conf: -------------------------------------------------------------------------------- 1 | --num-mel-bins=13 2 | --frame-length=35 3 | --snip-edges=false 4 | --padd-extra-zero=true 5 | --sample-frequency=8000 6 | -------------------------------------------------------------------------------- /egs/callhome_egyptian/s5/conf/online_cmvn.conf: -------------------------------------------------------------------------------- 1 | # configuration file for apply-cmvn-online, used in the script ../local/online/run_online_decoding_nnet2.sh 2 | 
-------------------------------------------------------------------------------- /egs/fisher_swbd/s5/conf/decode.config: -------------------------------------------------------------------------------- 1 | beam=11.0 # beam for decoding. Was 13.0 in the scripts. 2 | first_beam=8.0 # beam for 1st-pass decoding in SAT. 3 | -------------------------------------------------------------------------------- /egs/ami/s5/conf/decode_dnn.conf: -------------------------------------------------------------------------------- 1 | beam=13.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=8.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/cifar/v1/image/README.txt: -------------------------------------------------------------------------------- 1 | This directory contains various scripts that relate to image recognition: specifically, 2 | the recognition of fixed-size images. 3 | -------------------------------------------------------------------------------- /egs/csj/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=13.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=8.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/fisher_callhome_spanish/s5/local/spron.pl: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/egs/fisher_callhome_spanish/s5/local/spron.pl -------------------------------------------------------------------------------- /egs/hkust/s5/conf/decode.config: -------------------------------------------------------------------------------- 1 | beam=11.0 # beam for decoding. Was 13.0 in the scripts. 2 | first_beam=8.0 # beam for 1st-pass decoding in SAT. 
3 | 4 | 5 | 6 | -------------------------------------------------------------------------------- /egs/reverb/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=18.0 # beam for decoding. Was 13.0 in the scripts. 2 | latbeam=10.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/sprakbanken/s5/local/sprak_run_nnet_cpu.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | . ./cmd.sh 4 | 5 | 6 | # ... 7 | 8 | local/nnet2/sprak_run_5c.sh $1 $2 $3 9 | 10 | -------------------------------------------------------------------------------- /misc/papers/asru11_toolkit/figs/kaldi-lib.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/misc/papers/asru11_toolkit/figs/kaldi-lib.pdf -------------------------------------------------------------------------------- /egs/aspire/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=13.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=8.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/aurora4/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=18.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=10.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/chime2/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=18.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=10.0 # this has most effect on size of the lattices. 
3 | -------------------------------------------------------------------------------- /egs/chime3/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=18.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=10.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/fame/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=18.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=10.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/lre07/v2/conf/mfcc_asr.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | --sample-frequency=8000 # Switchboard is sampled at 8kHz 3 | --snip-edges=false 4 | -------------------------------------------------------------------------------- /egs/sprakbanken/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=18.0 # beam for decoding. Was 13.0 in the scripts. 2 | latbeam=10.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/sprakbanken_swe/s5/local/sprak_run_nnet_cpu.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | . ./cmd.sh 4 | 5 | 6 | # ... 7 | 8 | local/nnet2/sprak_run_5c.sh $1 $2 $3 9 | 10 | -------------------------------------------------------------------------------- /egs/sre10/v2/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=13.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=8.0 # this has most effect on size of the lattices. 
3 | -------------------------------------------------------------------------------- /egs/sre10/v2/conf/mfcc_asr.conf: -------------------------------------------------------------------------------- 1 | --use-energy=false # only non-default option. 2 | --sample-frequency=8000 # Switchboard is sampled at 8kHz 3 | --snip-edges=false 4 | -------------------------------------------------------------------------------- /egs/swbd/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=13.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=8.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/swbd/s5b/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=13.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=8.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/swbd/s5c/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=13.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=8.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/tedlium/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=13.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=8.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/thchs30/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=18.0 # beam for decoding. Was 13.0 in the scripts. 
2 | lattice_beam=10.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/wsj/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=18.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=10.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/chime4/s5_1ch/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=18.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=10.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/chime4/s5_2ch/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=18.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=10.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/chime4/s5_6ch/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=18.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=10.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/gale_arabic/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=18.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=10.0 # this has most effect on size of the lattices. 
3 | -------------------------------------------------------------------------------- /egs/sprakbanken_swe/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=18.0 # beam for decoding. Was 13.0 in the scripts. 2 | latbeam=10.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/sre10/v2/conf/decode.config: -------------------------------------------------------------------------------- 1 | beam=11.0 # beam for decoding. Was 13.0 in the scripts. 2 | first_beam=8.0 # beam for 1st-pass decoding in SAT. 3 | lattice_beam=6.0 4 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=13.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=8.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/wsj/s5/steps/libs/nnet3/report/__init__.py: -------------------------------------------------------------------------------- 1 | 2 | 3 | # Copyright 2016 Vimal Manohar 4 | # Apache 2.0. 5 | 6 | import log_parse 7 | 8 | __all__ = ["log_parse"] 9 | -------------------------------------------------------------------------------- /misc/papers/asru11_toolkit_poster/kaldi-poster.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/misc/papers/asru11_toolkit_poster/kaldi-poster.pdf -------------------------------------------------------------------------------- /egs/callhome_egyptian/s5/conf/decode.config: -------------------------------------------------------------------------------- 1 | # Use wider-than-normal decoding beams for RM. 
2 | first_beam=16.0 3 | beam=20.0 4 | lat_beam=10.0 5 | min_lmwt=2 6 | max_lmwt=10 7 | -------------------------------------------------------------------------------- /egs/fisher_callhome_spanish/s5/conf/decode.config: -------------------------------------------------------------------------------- 1 | # Use wider-than-normal decoding beams. 2 | first_beam=16.0 3 | beam=20.0 4 | lat_beam=10.0 5 | min_lmwt=2 6 | max_lmwt=10 7 | -------------------------------------------------------------------------------- /egs/fisher_english/s5/conf/decode.config: -------------------------------------------------------------------------------- 1 | beam=11.0 # beam for decoding. Was 13.0 in the scripts. 2 | first_beam=8.0 # beam for 1st-pass decoding in SAT. 3 | lattice_beam=6.0 4 | -------------------------------------------------------------------------------- /egs/fisher_english/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=13.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=8.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/gale_mandarin/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=18.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=10.0 # this has most effect on size of the lattices. 3 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | beam=13.0 # beam for decoding. Was 13.0 in the scripts. 2 | lattice_beam=8.0 # this has most effect on size of the lattices. 
3 | -------------------------------------------------------------------------------- /src/probe/Makefile.slow_expf: -------------------------------------------------------------------------------- 1 | 2 | all: 3 | include ../kaldi.mk 4 | 5 | CXXFLAGS += -O0 6 | 7 | BINFILES = exp-test 8 | 9 | include ../makefiles/default_rules.mk 10 | -------------------------------------------------------------------------------- /egs/hkust/s5/local/score.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | set -e -o pipefail 4 | set -x 5 | steps/score_kaldi.sh "$@" 6 | steps/score_kaldi_cer.sh --stage 2 "$@" 7 | 8 | echo "$0: Done" 9 | -------------------------------------------------------------------------------- /misc/papers/asru11_toolkit_poster/figures/kaldi-lib.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/misc/papers/asru11_toolkit_poster/figures/kaldi-lib.pdf -------------------------------------------------------------------------------- /egs/swbd/s5c/local/chain/compare_wer_tdnn.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | models="" 4 | for x in $*; do models="$models tdnn_${x}"; done 5 | 6 | local/chain/compare_wer_general.sh $models 7 | -------------------------------------------------------------------------------- /egs/aspire/s5/conf/decode.config: -------------------------------------------------------------------------------- 1 | beam=13.0 # beam for decoding. Was 13.0 in the scripts. 2 | first_beam=8.0 # beam for 1st-pass decoding in SAT. 
3 | lattice_beam=8.0 4 | max_active=10000 5 | -------------------------------------------------------------------------------- /egs/hkust/s5/conf/pinyin_initial: -------------------------------------------------------------------------------- 1 | B 2 | C 3 | CH 4 | D 5 | F 6 | G 7 | H 8 | J 9 | K 10 | L 11 | M 12 | N 13 | P 14 | Q 15 | R 16 | S 17 | SH 18 | T 19 | W 20 | X 21 | Y 22 | Z 23 | ZH 24 | -------------------------------------------------------------------------------- /egs/iban/s5/cmd.sh: -------------------------------------------------------------------------------- 1 | #export train_cmd="run.pl --max-jobs-run 32" 2 | #export decode_cmd="run.pl --max-jobs-run 32" 3 | 4 | export train_cmd="queue.pl" 5 | export decode_cmd="queue.pl --mem 4G" 6 | -------------------------------------------------------------------------------- /misc/papers/asru11_toolkit_poster/figures/KaldiTextAndLogo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/saeidmokaram/Kaldi-on-RaspberryPi2/HEAD/misc/papers/asru11_toolkit_poster/figures/KaldiTextAndLogo.png -------------------------------------------------------------------------------- /egs/swahili/s5/cmd.sh: -------------------------------------------------------------------------------- 1 | # JHU cluster options 2 | export train_cmd="queue.pl" 3 | export decode_cmd="queue.pl --mem 4G" 4 | export cuda_cmd="queue --gpu 1" 5 | export mkgraph_cmd="queue.pl --mem 4G" 6 | -------------------------------------------------------------------------------- /windows/NewGuidCmd.exe.config: -------------------------------------------------------------------------------- 1 | 2 | 3 | 4 | 5 | 6 | 7 | -------------------------------------------------------------------------------- /egs/lre/v1/local/callfriend_lang.txt: -------------------------------------------------------------------------------- 1 | 48 french 2 | 49 arabic.standard 3 | 54 korean 4 | 55 
chinese.mandarin.mainland 5 | 56 chinese.mandarin.taiwan 6 | 57 spanish.caribbean 7 | 58 spanish.noncaribbean 8 | -------------------------------------------------------------------------------- /src/lm/examples/CREATURE.txt: -------------------------------------------------------------------------------- 1 | boy 2 | boy 3 | boy 4 | boy 5 | boy 6 | boy 7 | boy 8 | girl 9 | girl 10 | pretty girl 11 | cat 12 | dog 13 | dog 14 | dog 15 | rat 16 | red faced clown 17 | green caterpillar 18 | -------------------------------------------------------------------------------- /egs/aurora4/s5/conf/train_dnn.config: -------------------------------------------------------------------------------- 1 | momentum=0 2 | l1_penalty=0 3 | l2_penalty=0 4 | max_iters=25 5 | min_iters= 6 | start_halving_inc=0.5 7 | end_halving_inc=0.1 8 | halving_factor=0.7 9 | cache_size=32768 10 | -------------------------------------------------------------------------------- /egs/aurora4/s5/conf/train_dnn_1.config: -------------------------------------------------------------------------------- 1 | momentum=0 2 | l1_penalty=0 3 | l2_penalty=0 4 | max_iters=30 5 | min_iters= 6 | start_halving_inc=0.5 7 | end_halving_inc=0.1 8 | halving_factor=0.5 9 | cache_size=65536 10 | -------------------------------------------------------------------------------- /egs/aurora4/s5/conf/train_nnet.config: -------------------------------------------------------------------------------- 1 | momentum=0 2 | l1_penalty=0 3 | l2_penalty=0 4 | max_iters=25 5 | min_iters= 6 | start_halving_inc=0.5 7 | end_halving_inc=0.1 8 | halving_factor=0.7 9 | cache_size=32768 10 | -------------------------------------------------------------------------------- /egs/aurora4/s5/conf/train_dnn_2.config: -------------------------------------------------------------------------------- 1 | momentum=0.9 2 | l1_penalty=0 3 | l2_penalty=0 4 | max_iters=10 5 | min_iters=10 6 | start_halving_inc=0.5 7 | end_halving_inc=0.1 8 | halving_factor=0.7 
9 | cache_size=32768 10 | -------------------------------------------------------------------------------- /egs/lre/v1/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | --frame-length=20 # the default is 25. 3 | --low-freq=20 # the default. 4 | --high-freq=3700 # the default is zero meaning use the Nyquist (4k in this case). 5 | --num-ceps=7 6 | -------------------------------------------------------------------------------- /egs/lre07/v1/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | --frame-length=20 # the default is 25. 3 | --low-freq=20 # the default. 4 | --high-freq=3700 # the default is zero meaning use the Nyquist (4k in this case). 5 | --num-ceps=7 6 | -------------------------------------------------------------------------------- /egs/ami/s5/local/split_eval.orig: -------------------------------------------------------------------------------- 1 | EN2002a 2 | EN2002b 3 | EN2002c 4 | EN2002d 5 | ES2004a 6 | ES2004b 7 | ES2004c 8 | ES2004d 9 | IS1009a 10 | IS1009b 11 | IS1009c 12 | IS1009d 13 | TS3003a 14 | TS3003b 15 | TS3003c 16 | TS3003d 17 | -------------------------------------------------------------------------------- /egs/lre/v1/conf/mfcc_vtln.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | --frame-length=20 # the default is 25. 3 | --low-freq=20 # the default. 4 | --high-freq=3700 # the default is zero meaning use the Nyquist (4k in this case). 
5 | --num-ceps=13 6 | -------------------------------------------------------------------------------- /egs/lre/v1/lid/README.txt: -------------------------------------------------------------------------------- 1 | Note: these scripts are mostly the same as the speaker-id scripts in 2 | ../../../sre08/v1/sid, except that they use add-deltas-sdc instead of 3 | add-deltas, and a smaller default ivector dimension (400 vs. 600). 4 | -------------------------------------------------------------------------------- /egs/lre07/v1/conf/mfcc_vtln.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | --frame-length=20 # the default is 25. 3 | --low-freq=20 # the default. 4 | --high-freq=3700 # the default is zero meaning use the Nyquist (4k in this case). 5 | --num-ceps=7 6 | -------------------------------------------------------------------------------- /egs/vystadial_cz/online_demo/display_gmm_latgen.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | # source the settings 4 | . path.sh 5 | 6 | for n in `cut -d' ' -f1 $wav_scp` ; do 7 | utils/show_lattice.sh --mode save --format svg $n $lattice $wst 8 | done 9 | -------------------------------------------------------------------------------- /misc/papers/asru11_toolkit_poster/README: -------------------------------------------------------------------------------- 1 | 2 | This currently just contains a template I modified from one of Aachen University's. 3 | It needs very updated LaTeX packages to compile-- try to find a machine where you can compile. 4 | [dan] 5 | -------------------------------------------------------------------------------- /tools/extras/install_openblas.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | # to be run from .. 
4 | # this script just exists to tell you how you'd make openblas- we actually did it via Makefile rules, 5 | # but it's not a default target. 6 | 7 | make openblas 8 | -------------------------------------------------------------------------------- /egs/lre07/v1/lid/README.txt: -------------------------------------------------------------------------------- 1 | Note: these scripts are mostly the same as the speaker-id scripts in 2 | ../../../sre08/v1/sid, except that they use add-deltas-sdc instead of 3 | add-deltas, and a smaller default ivector dimension (400 vs. 600). 4 | -------------------------------------------------------------------------------- /egs/sprakbanken/s5/local/wer_hyp_filter: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | perl -C -pe 's:::g; s:::g; s:::g' | \ 4 | perl -pe 's/é|è|ë/e/g; s/á|à|ä/a/g; s/ó|ò|ö/o/g; s/ú|ù|ü/u/g; s/É|È|Ë/E/g; s/Ó|Ò|Ö/O/g;' | \ 5 | PERLIO=:utf8 perl -pe '$_=lc' 6 | -------------------------------------------------------------------------------- /egs/sprakbanken/s5/local/wer_ref_filter: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | perl -C -pe 's:::g; s:::g; s:::g' | \ 4 | perl -pe 's/é|è|ë/e/g; s/á|à|ä/a/g; s/ó|ò|ö/o/g; s/ú|ù|ü/u/g; s/É|È|Ë/E/g; s/Ó|Ò|Ö/O/g;' | \ 5 | PERLIO=:utf8 perl -pe '$_=lc' 6 | -------------------------------------------------------------------------------- /egs/gp/s5/conf/sgmm.conf: -------------------------------------------------------------------------------- 1 | CZ 3100 10000 2 | FR 3100 10000 3 | GE 3100 10000 4 | PO 3100 10000 5 | PL 3100 10000 6 | RU 3100 10000 7 | SP 3100 10000 8 | SW 3100 10000 9 | TH 3100 10000 10 | TA 3100 10000 11 | TU 3100 10000 12 | VN 3100 10000 13 | -------------------------------------------------------------------------------- /egs/gp/s5/conf/tri.conf: -------------------------------------------------------------------------------- 1 | CZ 3100 
50000 2 | FR 3100 50000 3 | GE 3100 50000 4 | PO 3100 50000 5 | PL 3100 50000 6 | RU 3100 50000 7 | SP 3100 50000 8 | SW 3100 50000 9 | TH 3100 50000 10 | TA 3100 50000 11 | TU 3100 50000 12 | VN 3100 50000 13 | -------------------------------------------------------------------------------- /egs/multi_en/s5/local/ami_split_eval.orig: -------------------------------------------------------------------------------- 1 | EN2002a 2 | EN2002b 3 | EN2002c 4 | EN2002d 5 | ES2004a 6 | ES2004b 7 | ES2004c 8 | ES2004d 9 | IS1009a 10 | IS1009b 11 | IS1009c 12 | IS1009d 13 | TS3003a 14 | TS3003b 15 | TS3003c 16 | TS3003d 17 | -------------------------------------------------------------------------------- /egs/sprakbanken/s5/local/wer_output_filter: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | perl -C -pe 's:::g; s:::g; s:::g' | \ 4 | perl -pe 's/é|è|ë/e/g; s/á|à|ä/a/g; s/ó|ò|ö/o/g; s/ú|ù|ü/u/g; s/É|È|Ë/E/g; s/Ó|Ò|Ö/O/g;' | \ 5 | PERLIO=:utf8 perl -pe '$_=lc' 6 | -------------------------------------------------------------------------------- /egs/fisher_callhome_spanish/s5/local/callhome_text_pp.sh: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env bash 2 | # Copyright 2014 Gaurav Kumar. 
Apache 2.0 3 | 4 | if [ $# -gt 0 ]; then 5 | sentence=$1 6 | echo $sentence | sed 's:{^[}]*}:[noise]:' 7 | fi 8 | 9 | 10 | -------------------------------------------------------------------------------- /egs/wsj/s5/local/wer_hyp_filter: -------------------------------------------------------------------------------- 1 | #!/bin/sed -f 2 | s:::g 3 | s:::g 4 | s:::g 5 | s/://g 6 | s/\*//g 7 | s/-HOLDER/HOLDER/g 8 | s/COMPAIGN/CAMPAIGN/g 9 | s/APPROACHES-/APPROACHES/g 10 | s/RESEACHERS/RESEARCHERS/g 11 | 12 | -------------------------------------------------------------------------------- /egs/wsj/s5/local/wer_ref_filter: -------------------------------------------------------------------------------- 1 | #!/bin/sed -f 2 | s:::g 3 | s:::g 4 | s:::g 5 | s/://g 6 | s/\*//g 7 | s/-HOLDER/HOLDER/g 8 | s/COMPAIGN/CAMPAIGN/g 9 | s/APPROACHES-/APPROACHES/g 10 | s/RESEACHERS/RESEARCHERS/g 11 | 12 | -------------------------------------------------------------------------------- /egs/wsj/s5/steps/libs/__init__.py: -------------------------------------------------------------------------------- 1 | 2 | 3 | # Copyright 2016 Vimal Manohar 4 | # Apache 2.0. 5 | 6 | """ This package contains modules and subpackages used in kaldi scripts. 
7 | """ 8 | 9 | import common 10 | 11 | __all__ = ["common"] 12 | -------------------------------------------------------------------------------- /egs/ami/s5/local/split_dev.orig: -------------------------------------------------------------------------------- 1 | ES2011a 2 | ES2011b 3 | ES2011c 4 | ES2011d 5 | IB4001 6 | IB4002 7 | IB4003 8 | IB4004 9 | IB4010 10 | IB4011 11 | IS1008a 12 | IS1008b 13 | IS1008c 14 | IS1008d 15 | TS3004a 16 | TS3004b 17 | TS3004c 18 | TS3004d 19 | -------------------------------------------------------------------------------- /egs/lre07/v1/local/general_lr_closed_set_langs.txt: -------------------------------------------------------------------------------- 1 | arabic 0 2 | bengali 1 3 | chinese 2 4 | english 3 5 | farsi 4 6 | german 5 7 | hindustani 6 8 | japanese 7 9 | korean 8 10 | russian 9 11 | spanish 10 12 | tamil 11 13 | thai 12 14 | vietnamese 13 15 | -------------------------------------------------------------------------------- /egs/lre07/v2/local/general_lr_closed_set_langs.txt: -------------------------------------------------------------------------------- 1 | arabic 0 2 | bengali 1 3 | chinese 2 4 | english 3 5 | farsi 4 6 | german 5 7 | hindustani 6 8 | japanese 7 9 | korean 8 10 | russian 9 11 | spanish 10 12 | tamil 11 13 | thai 12 14 | vietnamese 13 15 | -------------------------------------------------------------------------------- /egs/swahili/s5/local/prepare_lm.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | . 
./path.sh || die "path.sh expected"; 4 | 5 | cd data 6 | #convert to FST format for Kaldi 7 | arpa2fst --disambig-symbol=#0 --read-symbol-table=lang/words.txt \ 8 | local/swahili.arpa lang/G.fst 9 | -------------------------------------------------------------------------------- /egs/wsj/s5/local/wer_output_filter: -------------------------------------------------------------------------------- 1 | #!/bin/sed -f 2 | s:::g 3 | s:::g 4 | s:::g 5 | s/://g 6 | s/\*//g 7 | s/-HOLDER/HOLDER/g 8 | s/COMPAIGN/CAMPAIGN/g 9 | s/APPROACHES-/APPROACHES/g 10 | s/RESEACHERS/RESEARCHERS/g 11 | 12 | -------------------------------------------------------------------------------- /egs/lre07/v2/conf/mfcc_vtln.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | --frame-length=25 # the default is 25. 3 | --low-freq=20 # the default. 4 | --high-freq=3700 # the default is zero meaning use the Nyquist (4k in this case). 5 | --num-ceps=20 6 | --snip-edges=false 7 | -------------------------------------------------------------------------------- /egs/bn_music_speech/v1/README: -------------------------------------------------------------------------------- 1 | The MUSAN corpus is required for system training. It is available at: 2 | http://www.openslr.org/17/ 3 | 4 | The test requires Broadcast News data. 
The LDC Catalog numbers are: 5 | Speech LDC97S44 6 | Transcripts LDC97T22 7 | -------------------------------------------------------------------------------- /egs/multi_en/s5/local/ami_split_dev.orig: -------------------------------------------------------------------------------- 1 | ES2011a 2 | ES2011b 3 | ES2011c 4 | ES2011d 5 | IB4001 6 | IB4002 7 | IB4003 8 | IB4004 9 | IB4010 10 | IB4011 11 | IS1008a 12 | IS1008b 13 | IS1008c 14 | IS1008d 15 | TS3004a 16 | TS3004b 17 | TS3004c 18 | TS3004d 19 | -------------------------------------------------------------------------------- /egs/sre08/v1/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | --frame-length=20 # the default is 25. 3 | --low-freq=20 # the default. 4 | --high-freq=3700 # the default is zero meaning use the Nyquist (4k in this case). 5 | --num-ceps=20 # higher than the default which is 12. 6 | -------------------------------------------------------------------------------- /egs/aspire/README.txt: -------------------------------------------------------------------------------- 1 | This recipe is JHU's submission to the ASpIRE challenge. It uses 2 | Fisher-English corpus for training the acoustic and language models. 3 | It uses impulse responses and noises from RWCP, AIR and Reverb2014 4 | databases to create multi-condition data 5 | -------------------------------------------------------------------------------- /egs/tedlium/s5/local/nnet3/README: -------------------------------------------------------------------------------- 1 | To produce the results from: 2 | 3 | "Purely sequence-trained neural networks for ASR based on lattice-free MMI", Povey et al. 
4 | 5 | Run the following in order: 6 | 7 | ./run.sh 8 | local/nnet3/run_tdnn.sh 9 | local/nnet3/run_tdnn_discriminative.sh -------------------------------------------------------------------------------- /egs/an4/s5/README.md: -------------------------------------------------------------------------------- 1 | This is a recipe for CMU's [AN4](http://www.speech.cs.cmu.edu/databases/an4/). 2 | 3 | To run, download the Sphere-format database from the link above and extract the files (`tar xvfz an4_sphere.tar.gz`). Then edit `an4_root` in `run.sh` to point to the AN4 directory. 4 | -------------------------------------------------------------------------------- /egs/lre07/v2/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | --frame-length=25 # the default is 25 3 | --low-freq=20 # the default. 4 | --high-freq=3700 # the default is zero meaning use the Nyquist (4k in this case). 5 | --num-ceps=20 # higher than the default which is 12. 6 | --snip-edges=false 7 | -------------------------------------------------------------------------------- /egs/rm/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | --window-type=hamming # disable Dans window, use the standard 2 | --use-energy=false # only fbank outputs 3 | --dither=1 4 | --num-mel-bins=40 # 8 filters/octave, 40 filters/16Khz as used by IBM 5 | --htk-compat=true # try to make it compatible with HTK 6 | -------------------------------------------------------------------------------- /egs/sre10/v1/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | --frame-length=25 # the default is 25 3 | --low-freq=20 # the default. 4 | --high-freq=3700 # the default is zero meaning use the Nyquist (4k in this case). 5 | --num-ceps=20 # higher than the default which is 12. 
6 | --snip-edges=false 7 | -------------------------------------------------------------------------------- /egs/sre10/v2/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=8000 2 | --frame-length=25 # the default is 25 3 | --low-freq=20 # the default. 4 | --high-freq=3700 # the default is zero meaning use the Nyquist (4k in this case). 5 | --num-ceps=20 # higher than the default which is 12. 6 | --snip-edges=false 7 | -------------------------------------------------------------------------------- /egs/timit/s5/conf/test_spk.list: -------------------------------------------------------------------------------- 1 | mdab0 2 | mwbt0 3 | felc0 4 | mtas1 5 | mwew0 6 | fpas0 7 | mjmp0 8 | mlnt0 9 | fpkt0 10 | mlll0 11 | mtls0 12 | fjlm0 13 | mbpm0 14 | mklt0 15 | fnlp0 16 | mcmj0 17 | mjdh0 18 | fmgd0 19 | mgrt0 20 | mnjm0 21 | fdhc0 22 | mjln0 23 | mpam0 24 | fmld0 25 | -------------------------------------------------------------------------------- /egs/wsj/s5/steps/libs/nnet3/xconfig/layers.py: -------------------------------------------------------------------------------- 1 | # Copyright 2016 Johns Hopkins University (Dan Povey) 2 | # 2016 Vijayaditya Peddinti 3 | # 2016 Yiming Wang 4 | # Apache 2.0. 5 | 6 | from basic_layers import * 7 | from convolution import * 8 | from lstm import * 9 | -------------------------------------------------------------------------------- /egs/ami/s5/local/split_REAMDE.txt: -------------------------------------------------------------------------------- 1 | The splits in this directory follow the official AMI Corpus Full-ASR split 2 | on train, dev and eval sets. 3 | 4 | If for some reason one needs to use a different split, the way to do so is 5 | to create split_*.final versions in this directory and run the recipe.
6 | -------------------------------------------------------------------------------- /egs/ami/s5b/local/split_REAMDE.txt: -------------------------------------------------------------------------------- 1 | The splits in this directory follow the official AMI Corpus Full-ASR split 2 | on train, dev and eval sets. 3 | 4 | If for some reason one needs to use a different split, the way to do so is 5 | to create split_*.final versions in this directory and run the recipe. 6 | -------------------------------------------------------------------------------- /egs/tedlium/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | --window-type=hamming # disable Dans window, use the standard 2 | --use-energy=false # only fbank outputs 3 | --dither=1 4 | --num-mel-bins=40 # 8 filters/octave, 40 filters/16Khz as used by IBM 5 | --htk-compat=true # try to make it compatible with HTK 6 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | --window-type=hamming # disable Dans window, use the standard 2 | --use-energy=false # only fbank outputs 3 | --dither=1 4 | --num-mel-bins=40 # 8 filters/octave, 40 filters/16Khz as used by IBM 5 | --htk-compat=true # try to make it compatible with HTK 6 | -------------------------------------------------------------------------------- /egs/bn_music_speech/v1/conf/mfcc.conf: -------------------------------------------------------------------------------- 1 | --sample-frequency=16000 2 | --frame-length=25 # the default is 25 3 | --low-freq=20 # the default. 4 | --high-freq=3700 # the default is zero meaning use the Nyquist (8k in this case). 5 | --num-ceps=20 # higher than the default which is 12.
6 | --snip-edges=false 7 | -------------------------------------------------------------------------------- /egs/farsdat/s5/conf/test_spk.list: -------------------------------------------------------------------------------- 1 | 007 2 | 010 3 | 032 4 | 037 5 | 044 6 | 090 7 | 097 8 | 125 9 | 139 10 | 143 11 | 152 12 | 155 13 | 167 14 | 172 15 | 181 16 | 212 17 | 213 18 | 219 19 | 225 20 | 233 21 | 236 22 | 242 23 | 250 24 | 273 25 | 274 26 | 275 27 | 280 28 | 283 29 | 288 30 | 295 31 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | --window-type=hamming # disable Dans window, use the standard 2 | --use-energy=false # only fbank outputs 3 | --dither=1 4 | --num-mel-bins=40 # 8 filters/octave, 40 filters/16Khz as used by IBM 5 | --htk-compat=true # try to make it compatible with HTK 6 | -------------------------------------------------------------------------------- /INSTALL: -------------------------------------------------------------------------------- 1 | This is the official Kaldi INSTALL. Look also at INSTALL.md for the git mirror installation. 2 | [for native Windows install, see windows/INSTALL] 3 | 4 | (1) 5 | go to tools/ and follow INSTALL instructions there. 6 | 7 | (2) 8 | go to src/ and follow INSTALL instructions there. 9 | 10 | -------------------------------------------------------------------------------- /egs/yesno/s5/local/create_yesno_wav_scp.pl: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env perl 2 | 3 | $waves_dir = $ARGV[0]; 4 | $in_list = $ARGV[1]; 5 | 6 | open IL, $in_list; 7 | 8 | while ($l = <IL>) 9 | { 10 | chomp($l); 11 | $full_path = $waves_dir . "\/" . 
$l; 12 | $l =~ s/\.wav//; 13 | print "$l $full_path\n"; 14 | } 15 | -------------------------------------------------------------------------------- /egs/fisher_english/s5/local/run_nnet2.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | 4 | # This shows what you can potentially run; you'd probably want to pick and choose. 5 | # The ones with _gpu in their name are tuned for GPUs. 6 | 7 | 8 | use_gpu=true 9 | 10 | if $use_gpu; then 11 | local/nnet2/run_6c_gpu.sh 12 | fi 13 | 14 | -------------------------------------------------------------------------------- /egs/gp/s1/conf/lang_codes.txt: -------------------------------------------------------------------------------- 1 | AR Arabic 2 | BL Bulgarian 3 | CR Croatian 4 | CZ Czech 5 | FR French 6 | GE German 7 | JA Japanese 8 | KO Korean 9 | CH Mandarin 10 | PL Polish 11 | PO Portuguese 12 | RU Russian 13 | SP Spanish 14 | SW Swedish 15 | TA Tamil 16 | TH Thai 17 | TU Turkish 18 | VN Vietnamese 19 | WU Wu 20 | -------------------------------------------------------------------------------- /egs/gp/s5/conf/lang_codes.txt: -------------------------------------------------------------------------------- 1 | AR Arabic 2 | BL Bulgarian 3 | CR Croatian 4 | CZ Czech 5 | FR French 6 | GE German 7 | JA Japanese 8 | KO Korean 9 | CH Mandarin 10 | PL Polish 11 | PO Portuguese 12 | RU Russian 13 | SP Spanish 14 | SW Swedish 15 | TA Tamil 16 | TH Thai 17 | TU Turkish 18 | VN Vietnamese 19 | WU Wu 20 | -------------------------------------------------------------------------------- /egs/babel/s5/local/eval_kw_subsets.sh: -------------------------------------------------------------------------------- 1 | KWSEval -e ecf.xml -r rttm -t keyword_outvocab.xml -s kwslist.xml -c -o -b -d -f ./kws/outvocab 2 | KWSEval -e ecf.xml -r rttm -t keyword_invocab.xml -s kwslist.xml -c -o -b -d -f ./kws/invocab 3 | KWSEval -e ecf.xml -r rttm -t kws.xml -s kwslist.xml -c -o -b -d -f 
./kws/fullvocab 4 | 5 | -------------------------------------------------------------------------------- /egs/babel/s5b/local/eval_kw_subsets.sh: -------------------------------------------------------------------------------- 1 | KWSEval -e ecf.xml -r rttm -t keyword_outvocab.xml -s kwslist.xml -c -o -b -d -f ./kws/outvocab 2 | KWSEval -e ecf.xml -r rttm -t keyword_invocab.xml -s kwslist.xml -c -o -b -d -f ./kws/invocab 3 | KWSEval -e ecf.xml -r rttm -t kws.xml -s kwslist.xml -c -o -b -d -f ./kws/fullvocab 4 | 5 | -------------------------------------------------------------------------------- /egs/babel/s5c/local/eval_kw_subsets.sh: -------------------------------------------------------------------------------- 1 | KWSEval -e ecf.xml -r rttm -t keyword_outvocab.xml -s kwslist.xml -c -o -b -d -f ./kws/outvocab 2 | KWSEval -e ecf.xml -r rttm -t keyword_invocab.xml -s kwslist.xml -c -o -b -d -f ./kws/invocab 3 | KWSEval -e ecf.xml -r rttm -t kws.xml -s kwslist.xml -c -o -b -d -f ./kws/fullvocab 4 | 5 | -------------------------------------------------------------------------------- /egs/babel/s5d/local/eval_kw_subsets.sh: -------------------------------------------------------------------------------- 1 | KWSEval -e ecf.xml -r rttm -t keyword_outvocab.xml -s kwslist.xml -c -o -b -d -f ./kws/outvocab 2 | KWSEval -e ecf.xml -r rttm -t keyword_invocab.xml -s kwslist.xml -c -o -b -d -f ./kws/invocab 3 | KWSEval -e ecf.xml -r rttm -t kws.xml -s kwslist.xml -c -o -b -d -f ./kws/fullvocab 4 | 5 | -------------------------------------------------------------------------------- /egs/cifar/README.txt: -------------------------------------------------------------------------------- 1 | 2 | This directory contains example scripts for image classification with the 3 | CIFAR-10 and CIFAR-100 datasets, which are available for free from 4 | https://www.cs.toronto.edu/~kriz/cifar.html. 
5 | 6 | This demonstrates applying the nnet3 framework to image classification for 7 | fixed size images. 8 | -------------------------------------------------------------------------------- /egs/svhn/README.txt: -------------------------------------------------------------------------------- 1 | 2 | This directory contains example scripts for image classification with the 3 | SVHN (Street View House Numbers) dataset, which is available for free from 4 | http://ufldl.stanford.edu/housenumbers/. 5 | 6 | This demonstrates applying the nnet3 framework to image classification for 7 | fixed size images. 8 | -------------------------------------------------------------------------------- /egs/yesno/s5/local/create_yesno_txt.pl: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env perl 2 | 3 | $in_list = $ARGV[0]; 4 | 5 | open IL, $in_list; 6 | 7 | while ($l = <IL>) 8 | { 9 | chomp($l); 10 | $l =~ s/\.wav//; 11 | $trans = $l; 12 | $trans =~ s/0/NO/g; 13 | $trans =~ s/1/YES/g; 14 | $trans =~ s/\_/ /g; 15 | print "$l $trans\n"; 16 | } 17 | -------------------------------------------------------------------------------- /src/feat/test_data/prepare_wav_in_ascii.m: -------------------------------------------------------------------------------- 1 | %convert the 16kHz, lin16, wav to ascii float format 2 | test = wavread('test.wav'); 3 | test = test*32768; 4 | 5 | fo = fopen('test_matlab.ascii','w'); 6 | fprintf(fo,'['); 7 | for i=1:size(test,1) 8 | fprintf(fo,' %g',test(i)); 9 | end 10 | fprintf(fo,' ]'); 11 | fclose(fo); 12 | -------------------------------------------------------------------------------- /src/lm/test_data/missing_backoffs.arpa: -------------------------------------------------------------------------------- 1 | 2 | \data\ 3 | ngram 1=4 4 | ngram 2=1 5 | ngram 3=2 6 | 7 | \1-grams: 8 | -5.234679 a -3.3 9 | -3.456783 b 10 | 0.0000000 -2.5 11 | -4.333333 12 | 13 | \2-grams: 14 | -1.30490 a -4.2 15 | 16 | \3-grams: 17 | 
-0.34958 a b 18 | -0.23940 a b 19 | 20 | \end\ 21 | -------------------------------------------------------------------------------- /egs/wsj/s5/steps/libs/nnet3/train/chain_objf/__init__.py: -------------------------------------------------------------------------------- 1 | 2 | 3 | # Copyright 2016 Vimal Manohar 4 | # Apache 2.0. 5 | 6 | """ This is a subpackage containing modules for training of 7 | deep neural network acoustic model with chain objective. 8 | """ 9 | 10 | import acoustic_model 11 | 12 | __all__ = ["acoustic_model"] 13 | -------------------------------------------------------------------------------- /egs/rm/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . $KALDI_ROOT/tools/config/common_path.sh 5 | export LC_ALL=C 6 | -------------------------------------------------------------------------------- /src/lm/test_data/input.arpa: -------------------------------------------------------------------------------- 1 | 2 | \data\ 3 | ngram 1=4 4 | ngram 2=2 5 | ngram 3=2 6 | 7 | \1-grams: 8 | -5.234679 a -3.3 9 | -3.456783 b 10 | 0.0000000 -2.5 11 | -4.333333 12 | 13 | \2-grams: 14 | -1.45678 a b -3.23 15 | -1.30490 a -4.2 16 | 17 | \3-grams: 18 | -0.34958 a b 19 | -0.23940 a b 20 | 21 | \end\ 22 | -------------------------------------------------------------------------------- /egs/aspire/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" 
&& exit 1 4 | . $KALDI_ROOT/tools/config/common_path.sh 5 | export LC_ALL=C 6 | -------------------------------------------------------------------------------- /egs/chime1/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . $KALDI_ROOT/tools/config/common_path.sh 5 | export LC_ALL=C 6 | -------------------------------------------------------------------------------- /egs/hkust/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | --window-type=hamming # disable Dans window, use the standard 2 | --sample-frequency=8000 3 | 4 | --low-freq=64 # typical setup from Frantisek Grezl 5 | --high-freq=3800 6 | --dither=1 7 | 8 | --num-mel-bins=36 # 8kHz so we use 36 bins (@ 8 filters/octave to get closer to 40 filters/16Khz used by IBM) 9 | -------------------------------------------------------------------------------- /egs/reverb/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . $KALDI_ROOT/tools/config/common_path.sh 5 | export LC_ALL=C 6 | -------------------------------------------------------------------------------- /egs/sre10/v1/local/dnn/README: -------------------------------------------------------------------------------- 1 | This directory contains DNN scripts based on the nnet2 recipes found in 2 | the ASR examples (e.g., fisher_english). 
The scripts have been modified 3 | for speaker recognition purposes. Most of the scripts are lightly modified 4 | versions of those appearing in the steps or local directories of 5 | egs/fisher_english. 6 | -------------------------------------------------------------------------------- /egs/swbd/s5b/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | --window-type=hamming # disable Dans window, use the standard 2 | --sample-frequency=8000 3 | 4 | --low-freq=64 # typical setup from Frantisek Grezl 5 | --high-freq=3800 6 | --dither=1 7 | 8 | --num-mel-bins=36 # 8kHz so we use 36 bins (@ 8 filters/octave to get closer to 40 filters/16Khz used by IBM) 9 | -------------------------------------------------------------------------------- /egs/swbd/s5c/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | --window-type=hamming # disable Dans window, use the standard 2 | --sample-frequency=8000 3 | 4 | --low-freq=64 # typical setup from Frantisek Grezl 5 | --high-freq=3800 6 | --dither=1 7 | 8 | --num-mel-bins=36 # 8kHz so we use 36 bins (@ 8 filters/octave to get closer to 40 filters/16Khz used by IBM) 9 | -------------------------------------------------------------------------------- /egs/an4/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . $KALDI_ROOT/tools/config/common_path.sh 5 | 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/gale_arabic/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=$(pwd)/../../.. 
2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . $KALDI_ROOT/tools/config/common_path.sh 5 | export LC_ALL=C 6 | -------------------------------------------------------------------------------- /egs/lre07/v2/local/dnn/README: -------------------------------------------------------------------------------- 1 | This directory contains DNN scripts based on the nnet2 recipes found in 2 | the ASR examples (e.g., fisher_english). The scripts have been modified 3 | for language recognition purposes. Most of the scripts are lightly modified 4 | versions of those appearing in the steps or local directories of 5 | egs/fisher_english. 6 | -------------------------------------------------------------------------------- /egs/swbd/s5c/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . $KALDI_ROOT/tools/config/common_path.sh 5 | 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/vystadial_cz/s5/common/mfcc.conf: -------------------------------------------------------------------------------- 1 | # --use-energy=false # non default option. 
False -> Use C0 instead energy 2 | # NUMCEPS in HTK is without C0: there 12 here 13 - default 3 | --low-freq=125 4 | --high-freq=3800 5 | # --htk-compat 6 | # --remove-dc-offset # equivalent ZMEANSOURCE in HTK 7 | # --subtract-mean # not recommended to do it this way 8 | -------------------------------------------------------------------------------- /egs/vystadial_en/s5/common/mfcc.conf: -------------------------------------------------------------------------------- 1 | # --use-energy=false # non default option. False -> Use C0 instead energy 2 | # NUMCEPS in HTK is without C0: there 12 here 13 - default 3 | --low-freq=125 4 | --high-freq=3800 5 | # --htk-compat 6 | # --remove-dc-offset # equivalent ZMEANSOURCE in HTK 7 | # --subtract-mean # not recommended to do it this way 8 | -------------------------------------------------------------------------------- /egs/callhome_egyptian/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . $KALDI_ROOT/tools/config/common_path.sh 5 | export LC_ALL=C 6 | -------------------------------------------------------------------------------- /egs/fisher_english/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . 
$KALDI_ROOT/tools/config/common_path.sh 5 | export LC_ALL=C 6 | -------------------------------------------------------------------------------- /egs/gale_arabic/s5b/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=$(pwd)/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . $KALDI_ROOT/tools/config/common_path.sh 5 | export LC_ALL=C 6 | -------------------------------------------------------------------------------- /egs/babel_multilang/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . 
$KALDI_ROOT/tools/config/common_path.sh 5 | 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/multi_en/s5/conf/MSU_single_letter.txt: -------------------------------------------------------------------------------- 1 | A ey 2 | B b iy 3 | C s iy 4 | D d iy 5 | E iy 6 | F eh f 7 | G jh iy 8 | H ey ch 9 | I ay 10 | J jh ey 11 | K k ey 12 | L eh l 13 | M eh m 14 | N eh n 15 | O ow 16 | P p iy 17 | Q k y uw 18 | R aa r 19 | S eh s 20 | T t iy 21 | U y uw 22 | V v iy 23 | W d ah b ax l y uw 24 | X eh k s 25 | Y w ay 26 | Z z iy 27 | -------------------------------------------------------------------------------- /egs/swbd/s5c/local/MSU_single_letter.txt: -------------------------------------------------------------------------------- 1 | A ey 2 | B b iy 3 | C s iy 4 | D d iy 5 | E iy 6 | F eh f 7 | G jh iy 8 | H ey ch 9 | I ay 10 | J jh ey 11 | K k ey 12 | L eh l 13 | M eh m 14 | N eh n 15 | O ow 16 | P p iy 17 | Q k y uw 18 | R aa r 19 | S eh s 20 | T t iy 21 | U y uw 22 | V v iy 23 | W d ah b ax l y uw 24 | X eh k s 25 | Y w ay 26 | Z z iy 27 | -------------------------------------------------------------------------------- /egs/fisher_callhome_spanish/s5/local/fix_stm.sh: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env bash 2 | 3 | # Fixes the CALLHOME stm files 4 | # Copyright 2014 Gaurav Kumar. Apache 2.0 5 | 6 | data_dir=$1 7 | 8 | cat $data_dir/stm | awk '{$1=substr(tolower($1),0,length($1)-4);print;}' > $data_dir/stm_new 9 | mv $data_dir/stm $data_dir/stm.bak 10 | mv $data_dir/stm_new $data_dir/stm 11 | -------------------------------------------------------------------------------- /egs/fisher_callhome_spanish/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 3 | [ ! 
-f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . $KALDI_ROOT/tools/config/common_path.sh 5 | export LC_ALL=C 6 | -------------------------------------------------------------------------------- /egs/fisher_swbd/s5/conf/MSU_single_letter.txt: -------------------------------------------------------------------------------- 1 | A ey 2 | B b iy 3 | C s iy 4 | D d iy 5 | E iy 6 | F eh f 7 | G jh iy 8 | H ey ch 9 | I ay 10 | J jh ey 11 | K k ey 12 | L eh l 13 | M eh m 14 | N eh n 15 | O ow 16 | P p iy 17 | Q k y uw 18 | R aa r 19 | S eh s 20 | T t iy 21 | U y uw 22 | V v iy 23 | W d ah b ax l y uw 24 | X eh k s 25 | Y w ay 26 | Z z iy 27 | -------------------------------------------------------------------------------- /src/lmbin/Makefile: -------------------------------------------------------------------------------- 1 | 2 | all: 3 | 4 | EXTRA_CXXFLAGS = -Wno-sign-compare 5 | include ../kaldi.mk 6 | 7 | BINFILES = arpa2fst arpa-to-const-arpa 8 | 9 | OBJFILES = 10 | 11 | TESTFILES = 12 | 13 | ADDLIBS = ../lm/kaldi-lm.a ../util/kaldi-util.a \ 14 | ../matrix/kaldi-matrix.a ../base/kaldi-base.a 15 | 16 | include ../makefiles/default_rules.mk 17 | -------------------------------------------------------------------------------- /egs/sprakbanken/s5/local/sprak_prep_lm.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | 4 | 5 | dir=$1 6 | 7 | split -l 50000 $dir/lmtxtfiles $dir/templist_ 8 | 9 | for f in $dir/templist_*; do 10 | cat $f | while read l; do 11 | cat $l; 12 | done > $f.sents; 13 | done 14 | 15 | cat $dir/templist_*.sents > $dir/lmsents 16 | 17 | wait 18 | 19 | rm -f $dir/templist_* 20 | -------------------------------------------------------------------------------- /misc/papers/icassp12_lat/Makefile: -------------------------------------------------------------------------------- 1 | 2 | all: 
paper.pdf 3 | cp paper.pdf ~/desktop/2012_icassp_lattices.pdf 4 | 5 | paper.pdf: paper.ps 6 | ps2pdf paper.ps paper.pdf 7 | 8 | 9 | paper.ps: paper.dvi 10 | dvips -o paper.ps paper.dvi 11 | 12 | paper.dvi: paper.tex refs.bib 13 | latex paper -o paper.dvi 14 | bibtex paper 15 | 16 | 17 | 18 | 19 | 20 | 21 | -------------------------------------------------------------------------------- /egs/callhome_egyptian/s5/local/splits/dev: -------------------------------------------------------------------------------- 1 | ar_4264.sph 2 | ar_4345.sph 3 | ar_4530.sph 4 | ar_4718.sph 5 | ar_4820.sph 6 | ar_4885.sph 7 | ar_4975.sph 8 | ar_5045.sph 9 | ar_5160.sph 10 | ar_5205.sph 11 | ar_5276.sph 12 | ar_5579.sph 13 | ar_5611.sph 14 | ar_5627.sph 15 | ar_5659.sph 16 | ar_5678.sph 17 | ar_5707.sph 18 | ar_5709.sph 19 | ar_5775.sph 20 | ar_5790.sph 21 | -------------------------------------------------------------------------------- /egs/callhome_egyptian/s5/local/splits/h5: -------------------------------------------------------------------------------- 1 | ar_4509.sph 2 | ar_4856.sph 3 | ar_5165.sph 4 | ar_5350.sph 5 | ar_5829.sph 6 | ar_6997.sph 7 | ar_7009.sph 8 | ar_7011.sph 9 | ar_7012.sph 10 | ar_7015.sph 11 | ar_7037.sph 12 | ar_7047.sph 13 | ar_7048.sph 14 | ar_7054.sph 15 | ar_7055.sph 16 | ar_7056.sph 17 | ar_7057.sph 18 | ar_7066.sph 19 | ar_7074.sph 20 | ar_7083.sph 21 | -------------------------------------------------------------------------------- /egs/callhome_egyptian/s5/local/splits/sup: -------------------------------------------------------------------------------- 1 | ar_4758.sph 2 | ar_4862.sph 3 | ar_5245.sph 4 | ar_5328.sph 5 | ar_5753.sph 6 | ar_5765.sph 7 | ar_5808.sph 8 | ar_5838.sph 9 | ar_7001.sph 10 | ar_7010.sph 11 | ar_7029.sph 12 | ar_7030.sph 13 | ar_7032.sph 14 | ar_7035.sph 15 | ar_7046.sph 16 | ar_7051.sph 17 | ar_7058.sph 18 | ar_7068.sph 19 | ar_7077.sph 20 | ar_7090.sph 21 | 
-------------------------------------------------------------------------------- /egs/callhome_egyptian/s5/local/splits/test: -------------------------------------------------------------------------------- 1 | ar_4482.sph 2 | ar_4486.sph 3 | ar_4510.sph 4 | ar_4527.sph 5 | ar_4540.sph 6 | ar_4579.sph 7 | ar_4687.sph 8 | ar_4695.sph 9 | ar_4780.sph 10 | ar_4864.sph 11 | ar_5091.sph 12 | ar_5271.sph 13 | ar_5453.sph 14 | ar_5567.sph 15 | ar_5595.sph 16 | ar_5679.sph 17 | ar_5734.sph 18 | ar_5766.sph 19 | ar_5767.sph 20 | ar_5827.sph 21 | -------------------------------------------------------------------------------- /egs/chime1/s5/config.sh: -------------------------------------------------------------------------------- 1 | case "$USER" in 2 | "ac1nmx") 3 | # CHiME Challenge wav root (after unzipping)... 4 | export WAV_ROOT="/data/ac1nmx/data/PCCdata16kHz" 5 | 6 | # Used by the recogniser for storing data/ exp/ mfcc/ etc 7 | export REC_ROOT="." 8 | ;; 9 | *) 10 | echo "Please define WAV_ROOT and REC_ROOT for user $USER" 11 | ;; 12 | esac 13 | 14 | -------------------------------------------------------------------------------- /egs/lre/v1/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$KALDI_ROOT/tools/sph2pipe_v2.5:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . $KALDI_ROOT/tools/config/common_path.sh 5 | export LC_ALL=C 6 | -------------------------------------------------------------------------------- /egs/lre07/v1/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$KALDI_ROOT/tools/sph2pipe_v2.5:$PWD:$PATH 3 | [ ! 
-f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . $KALDI_ROOT/tools/config/common_path.sh 5 | export LC_ALL=C 6 | -------------------------------------------------------------------------------- /egs/sre08/v1/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$KALDI_ROOT/tools/sph2pipe_v2.5:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . $KALDI_ROOT/tools/config/common_path.sh 5 | export LC_ALL=C 6 | -------------------------------------------------------------------------------- /egs/sre10/v1/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$KALDI_ROOT/tools/sph2pipe_v2.5:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . $KALDI_ROOT/tools/config/common_path.sh 5 | export LC_ALL=C 6 | -------------------------------------------------------------------------------- /egs/sre10/v2/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$KALDI_ROOT/tools/sph2pipe_v2.5:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . 
$KALDI_ROOT/tools/config/common_path.sh 5 | export LC_ALL=C 6 | -------------------------------------------------------------------------------- /egs/fisher_callhome_spanish/s5/local/splits/dev: -------------------------------------------------------------------------------- 1 | sp_0897.sph 2 | sp_0968.sph 3 | sp_0981.sph 4 | sp_1062.sph 5 | sp_1292.sph 6 | sp_1411.sph 7 | sp_1413.sph 8 | sp_1552.sph 9 | sp_1554.sph 10 | sp_1805.sph 11 | sp_1808.sph 12 | sp_1882.sph 13 | sp_1930.sph 14 | sp_1947.sph 15 | sp_2037.sph 16 | sp_2054.sph 17 | sp_2057.sph 18 | sp_2107.sph 19 | sp_2109.sph 20 | sp_2144.sph 21 | -------------------------------------------------------------------------------- /egs/bn_music_speech/v1/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$KALDI_ROOT/tools/sph2pipe_v2.5:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . 
$KALDI_ROOT/tools/config/common_path.sh 5 | export LC_ALL=C 6 | -------------------------------------------------------------------------------- /egs/fisher_callhome_spanish/s5/local/splits/test: -------------------------------------------------------------------------------- 1 | sp_0053.sph 2 | sp_0082.sph 3 | sp_0084.sph 4 | sp_0088.sph 5 | sp_0681.sph 6 | sp_0699.sph 7 | sp_0776.sph 8 | sp_0857.sph 9 | sp_1031.sph 10 | sp_1100.sph 11 | sp_1148.sph 12 | sp_1156.sph 13 | sp_1186.sph 14 | sp_1212.sph 15 | sp_1345.sph 16 | sp_1435.sph 17 | sp_1578.sph 18 | sp_1648.sph 19 | sp_1807.sph 20 | sp_1847.sph 21 | -------------------------------------------------------------------------------- /egs/hkust/README.txt: -------------------------------------------------------------------------------- 1 | About HKUST Mandarin Telephone Speech 2 | 3 | The data below were collected from Human Language Technology Center, HKUST 4 | 5 | LDC2005S15 : http://www.ldc.upenn.edu/Catalog/catalogEntry.jsp?catalogId=LDC2005S15 6 | LDC2005T32 : http://www.ldc.upenn.edu/Catalog/catalogEntry.jsp?catalogId=LDC2005T32 7 | 8 | s5: The experiments here were based on the above corpus 9 | -------------------------------------------------------------------------------- /egs/fisher_callhome_spanish/s5/local/splits/split_callhome/dev: -------------------------------------------------------------------------------- 1 | sp_0897.sph 2 | sp_0968.sph 3 | sp_0981.sph 4 | sp_1062.sph 5 | sp_1292.sph 6 | sp_1411.sph 7 | sp_1413.sph 8 | sp_1552.sph 9 | sp_1554.sph 10 | sp_1805.sph 11 | sp_1808.sph 12 | sp_1882.sph 13 | sp_1930.sph 14 | sp_1947.sph 15 | sp_2037.sph 16 | sp_2054.sph 17 | sp_2057.sph 18 | sp_2107.sph 19 | sp_2109.sph 20 | sp_2144.sph 21 | -------------------------------------------------------------------------------- /egs/apiai_decode/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 
2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . $KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/fisher_callhome_spanish/s5/local/splits/split_callhome/test: -------------------------------------------------------------------------------- 1 | sp_0053.sph 2 | sp_0082.sph 3 | sp_0084.sph 4 | sp_0088.sph 5 | sp_0681.sph 6 | sp_0699.sph 7 | sp_0776.sph 8 | sp_0857.sph 9 | sp_1031.sph 10 | sp_1100.sph 11 | sp_1148.sph 12 | sp_1156.sph 13 | sp_1186.sph 14 | sp_1212.sph 15 | sp_1345.sph 16 | sp_1435.sph 17 | sp_1578.sph 18 | sp_1648.sph 19 | sp_1807.sph 20 | sp_1847.sph 21 | -------------------------------------------------------------------------------- /egs/wsj/s5/steps/libs/nnet3/train/frame_level_objf/__init__.py: -------------------------------------------------------------------------------- 1 | 2 | 3 | # Copyright 2016 Vimal Manohar 4 | # Apache 2.0 5 | 6 | """ This library has classes and methods commonly used for training nnet3 7 | neural networks with frame-level objectives. 
8 | """ 9 | 10 | import common 11 | import raw_model 12 | import acoustic_model 13 | 14 | __all__ = ["common", "raw_model", "acoustic_model"] 15 | -------------------------------------------------------------------------------- /tools/extras/install_sctk_patched.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | # A patch for sctk-2.4.0 smooth installation under Cygwin 4 | 5 | os=`uname -a | awk '{printf $NF}'` 6 | 7 | if [ "$os" == "Cygwin" ] 8 | then 9 | cp src/rfilter1/makefile.in src/rfilter1/makefile.in.orig 10 | sed 's/OPTIONS=-DNEED_STRCMP=1/OPTIONS=/g' src/rfilter1/makefile.in > tmpf 11 | mv tmpf src/rfilter1/makefile.in 12 | fi 13 | -------------------------------------------------------------------------------- /egs/chime2/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . $KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/cifar/v1/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . 
$KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/fame/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . $KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/gale_mandarin/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=$(pwd)/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$KALDI_ROOT/tools/kaldi_lm:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . $KALDI_ROOT/tools/config/common_path.sh 5 | . $KALDI_ROOT/tools/env.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/hkust/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . 
$KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/iban/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . $KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/sprakbanken/s5/complexphones.txt: -------------------------------------------------------------------------------- 1 | & &+ 2 | 0 3 | 3 4 | e 5 | E 6 | i I 7 | o 8 | O 9 | u U 10 | V 11 | W W+ 12 | y Y 13 | @ @- 14 | a 15 | A 16 | aI 17 | n n- 18 | b B 19 | d 20 | D 21 | dZ tS 22 | f 23 | g 24 | h 25 | j ; J 26 | k 27 | l L 28 | m 29 | N ~ 30 | p 31 | r R R3 3- 32 | s z 33 | S x Z 34 | t 35 | T 36 | v 37 | w 38 | -------------------------------------------------------------------------------- /egs/svhn/v1/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . $KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/swbd/s5b/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . 
$KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . $KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/wsj/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . $KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/wsj/s5/utils/filt.py: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env python 2 | 3 | # Apache 2.0 4 | 5 | import sys 6 | 7 | vocab=set() 8 | with open(sys.argv[1]) as vocabfile: 9 | for line in vocabfile: 10 | vocab.add(line.strip()) 11 | 12 | with open(sys.argv[2]) as textfile: 13 | for line in textfile: 14 | print " ".join(map(lambda word: word if word in vocab else '', line.strip().split())) 15 | -------------------------------------------------------------------------------- /egs/aurora4/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . 
$KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/chime4/s5_1ch/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . $KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/chime4/s5_2ch/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . $KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/chime4/s5_6ch/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . 
$KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/fisher_swbd/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . $KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/hkust/s5/conf/cmu2pinyin: -------------------------------------------------------------------------------- 1 | AA A 2 | AE A 3 | AH A 4 | AO UO 5 | AW U 6 | AY AI 7 | B B 8 | CH CH 9 | D D 10 | DH S I 11 | EH AI 12 | ER E 13 | EY AI 14 | F F 15 | G G 16 | HH H 17 | IH I 18 | IY I 19 | JH ZH 20 | K K 21 | L L 22 | M M 23 | N N 24 | NG N 25 | OW UO 26 | OY UO 27 | P P 28 | R R 29 | S S 30 | SH SH 31 | T T 32 | TH S 33 | UH U 34 | UW U 35 | V W 36 | W W 37 | Y Y 38 | Z Z 39 | ZH X 40 | -------------------------------------------------------------------------------- /egs/sprakbanken/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . 
$KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/tidigits/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . $KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/gale_mandarin/s5/conf/cmu2pinyin: -------------------------------------------------------------------------------- 1 | AA A 2 | AE A 3 | AH A 4 | AO UO 5 | AW U 6 | AY AI 7 | B B 8 | CH CH 9 | D D 10 | DH S I 11 | EH AI 12 | ER E 13 | EY AI 14 | F F 15 | G G 16 | HH H 17 | IH I 18 | IY I 19 | JH ZH 20 | K K 21 | L L 22 | M M 23 | N N 24 | NG N 25 | OW UO 26 | OY UO 27 | P P 28 | R R 29 | S S 30 | SH SH 31 | T T 32 | TH S 33 | UH U 34 | UW U 35 | V W 36 | W W 37 | Y Y 38 | Z Z 39 | ZH X 40 | -------------------------------------------------------------------------------- /egs/sprakbanken_swe/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . 
$KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/thchs30/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . $KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | 8 | -------------------------------------------------------------------------------- /egs/yesno/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . 
$KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | 8 | 9 | -------------------------------------------------------------------------------- /src/lm/irstlm.mk: -------------------------------------------------------------------------------- 1 | # Additional definitions needed to build with the IRSTLM toolkit 2 | 3 | # Assumes IRSTLM includes and libraries have been installed under 4 | # $(SRCDIR)/../lmtoolkit/include/irstlm and $(SRCDIR)/../lmtoolkit/lib/irstlm 5 | 6 | EXTRA_CXXFLAGS = -DHAVE_IRSTLM -I$(SRCDIR)/../lmtoolkit/include -Wno-sign-compare 7 | EXTRA_LDLIBS = $(SRCDIR)/../lmtoolkit/lib/irstlm/x86_64-apple-darwin10.0/libirstlm.a -lz 8 | -------------------------------------------------------------------------------- /egs/ami/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | --window-type=hamming # disable Dans window, use the standard 2 | --use-energy=false # only fbank outputs 3 | --sample-frequency=16000 # AMI is sampled at 16kHz 4 | 5 | #--low-freq=64 # typical setup from Frantisek Grezl 6 | #--high-freq=3800 7 | --dither=1 8 | 9 | --num-mel-bins=40 # 16kHz so we use 40 bins 10 | --htk-compat=true # try to make it compatible with HTK 11 | -------------------------------------------------------------------------------- /egs/swbd/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | --window-type=hamming # disable Dans window, use the standard 2 | --use-energy=false # only fbank outputs 3 | --sample-frequency=8000 # audio is sampled at 8kHz 4 | 5 | --low-freq=64 # typical setup from Frantisek Grezl 6 | --high-freq=3800 7 | --dither=1 8 | 9 | --num-mel-bins=15 # 8kHz so we use 15 bins 10 | --htk-compat=true # try to make it compatible with HTK 11 | -------------------------------------------------------------------------------- /egs/wsj/s5/steps/libs/nnet3/train/__init__.py: 
-------------------------------------------------------------------------------- 1 | 2 | # Copyright 2016 Vimal Manohar 3 | # Apache 2.0 4 | 5 | """ This library has classes and methods commonly used for training nnet3 6 | neural networks. 7 | 8 | It has separate submodules for frame-level objectives and chain objective: 9 | frame_level_objf -- For both recurrent and non-recurrent architectures 10 | chain_objf -- LF-MMI objective training 11 | """ 12 | -------------------------------------------------------------------------------- /egs/gale_mandarin/README.txt: -------------------------------------------------------------------------------- 1 | 2 | This recipe is trained on LDC2013S08 (text transcripts from LDC2013T20) which is 3 | Gale Phase 2 Chinese Broadcast News speech: 126 hours of Mandarin Chinese 4 | broadcast news speech collected in 2006 and 2007 by LDC and HKUST. 5 | 6 | There is no separate test set; we just use 6 hours held out from the training 7 | data, to test on. 8 | 9 | The recipe is in s5/. 10 | 11 | 12 | -------------------------------------------------------------------------------- /egs/babel/s5/conf/glm: -------------------------------------------------------------------------------- 1 | ;; 2 | ;; File: ma970904.glm 3 | ;; Desc: This file contains the transcript filtering rules for the ARPA 4 | ;; Mandarin Hub5-NE Evaluation. 5 | ;; 6 | ;; Date: 970904 7 | ;; - initial creation 8 | ;; 9 | ;; Hesitation mappings 10 | => %HESITATION / [ ] __ [ ] 11 | => %HESITATION / [ ] __ [ ] 12 | => %HESITATION / [ ] __ [ ] 13 | 14 | -------------------------------------------------------------------------------- /egs/babel/s5b/conf/glm: -------------------------------------------------------------------------------- 1 | ;; 2 | ;; File: ma970904.glm 3 | ;; Desc: This file contains the transcript filtering rules for the ARPA 4 | ;; Mandarin Hub5-NE Evaluation. 
5 | ;; 6 | ;; Date: 970904 7 | ;; - initial creation 8 | ;; 9 | ;; Hesitation mappings 10 | => %HESITATION / [ ] __ [ ] 11 | => %HESITATION / [ ] __ [ ] 12 | => %HESITATION / [ ] __ [ ] 13 | 14 | -------------------------------------------------------------------------------- /egs/babel/s5c/conf/glm: -------------------------------------------------------------------------------- 1 | ;; 2 | ;; File: ma970904.glm 3 | ;; Desc: This file contains the transcript filtering rules for the ARPA 4 | ;; Mandarin Hub5-NE Evaluation. 5 | ;; 6 | ;; Date: 970904 7 | ;; - initial creation 8 | ;; 9 | ;; Hesitation mappings 10 | => %HESITATION / [ ] __ [ ] 11 | => %HESITATION / [ ] __ [ ] 12 | => %HESITATION / [ ] __ [ ] 13 | 14 | -------------------------------------------------------------------------------- /egs/babel/s5d/conf/glm: -------------------------------------------------------------------------------- 1 | ;; 2 | ;; File: ma970904.glm 3 | ;; Desc: This file contains the transcript filtering rules for the ARPA 4 | ;; Mandarin Hub5-NE Evaluation. 
5 | ;; 6 | ;; Date: 970904 7 | ;; - initial creation 8 | ;; 9 | ;; Hesitation mappings 10 | => %HESITATION / [ ] __ [ ] 11 | => %HESITATION / [ ] __ [ ] 12 | => %HESITATION / [ ] __ [ ] 13 | 14 | -------------------------------------------------------------------------------- /egs/hkust/s5/local/wer_hyp_filter: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env perl 2 | 3 | @filters=('[NOISE]','[LAUGHTER]','[VOCALIZED-NOISE]','','%HESITATION'); 4 | 5 | foreach $w (@filters) { 6 | $bad{$w} = 1; 7 | } 8 | 9 | while() { 10 | @A = split(" ", $_); 11 | $id = shift @A; 12 | print "$id "; 13 | foreach $a (@A) { 14 | if (!defined $bad{$a}) { 15 | print "$a "; 16 | } 17 | } 18 | print "\n"; 19 | } 20 | -------------------------------------------------------------------------------- /egs/hkust/s5/local/wer_ref_filter: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env perl 2 | 3 | @filters=('[NOISE]','[LAUGHTER]','[VOCALIZED-NOISE]','','%HESITATION'); 4 | 5 | foreach $w (@filters) { 6 | $bad{$w} = 1; 7 | } 8 | 9 | while() { 10 | @A = split(" ", $_); 11 | $id = shift @A; 12 | print "$id "; 13 | foreach $a (@A) { 14 | if (!defined $bad{$a}) { 15 | print "$a "; 16 | } 17 | } 18 | print "\n"; 19 | } 20 | -------------------------------------------------------------------------------- /egs/gale_mandarin/s5/local/wer_hyp_filter: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env perl 2 | 3 | @filters=('[NOISE]','[LAUGHTER]','[VOCALIZED-NOISE]','','%HESITATION'); 4 | 5 | foreach $w (@filters) { 6 | $bad{$w} = 1; 7 | } 8 | 9 | while() { 10 | @A = split(" ", $_); 11 | $id = shift @A; 12 | print "$id "; 13 | foreach $a (@A) { 14 | if (!defined $bad{$a}) { 15 | print "$a "; 16 | } 17 | } 18 | print "\n"; 19 | } 20 | -------------------------------------------------------------------------------- /egs/gale_mandarin/s5/local/wer_ref_filter: 
-------------------------------------------------------------------------------- 1 | #!/usr/bin/env perl 2 | 3 | @filters=('[NOISE]','[LAUGHTER]','[VOCALIZED-NOISE]','','%HESITATION'); 4 | 5 | foreach $w (@filters) { 6 | $bad{$w} = 1; 7 | } 8 | 9 | while() { 10 | @A = split(" ", $_); 11 | $id = shift @A; 12 | print "$id "; 13 | foreach $a (@A) { 14 | if (!defined $bad{$a}) { 15 | print "$a "; 16 | } 17 | } 18 | print "\n"; 19 | } 20 | -------------------------------------------------------------------------------- /egs/timit/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$KALDI_ROOT/tools/irstlm/bin/:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . $KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /misc/maintenance/check_usage_messages.sh: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env bash 2 | 3 | # run this from the top level of the repo, as 4 | # misc/maintenance/check_usage_messages.sh 5 | 6 | set -e 7 | 8 | cd src 9 | 10 | echo "Any errors reported below must be fixed manually." 
11 | grep 'Usage:' *bin/*.cc | \ 12 | perl -ane '@A = split; $path =$A[0]; $A[0] =~ s|.+/(.+).cc:|$1|; if ($A[0] ne $A[2]) { print "$path: $A[0] ne $A[2]\n"; } ' 13 | 14 | -------------------------------------------------------------------------------- /src/kws/Makefile: -------------------------------------------------------------------------------- 1 | 2 | all: 3 | 4 | include ../kaldi.mk 5 | 6 | EXTRA_CXXFLAGS += -Wno-sign-compare 7 | 8 | 9 | OBJFILES = kws-functions.o kws-functions2.o kws-scoring.o 10 | LIBNAME = kaldi-kws 11 | 12 | ADDLIBS = ../lat/kaldi-lat.a ../hmm/kaldi-hmm.a ../tree/kaldi-tree.a \ 13 | ../util/kaldi-util.a \ 14 | ../matrix/kaldi-matrix.a ../base/kaldi-base.a 15 | 16 | 17 | include ../makefiles/default_rules.mk 18 | -------------------------------------------------------------------------------- /egs/farsdat/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$KALDI_ROOT/tools/irstlm/bin/:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . 
$KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/lre07/v2/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=$(cd ../../..; pwd) 2 | export PATH=$PWD/utils/:$KALDI_ROOT/src/bin:$KALDI_ROOT/tools/openfst/bin:$KALDI_ROOT/src/fstbin/:$KALDI_ROOT/src/gmmbin/:$KALDI_ROOT/src/featbin/:$KALDI_ROOT/src/lmbin/:$KALDI_ROOT/src/sgmm2bin/:$KALDI_ROOT/src/fgmmbin/:$KALDI_ROOT/src/latbin/:$KALDI_ROOT/src/nnetbin:$KALDI_ROOT/src/nnet2bin:$KALDI_ROOT/src/ivectorbin:$KALDI_ROOT/tools/sph2pipe_v2.5:$PWD:$PATH 3 | export LC_ALL=C 4 | -------------------------------------------------------------------------------- /egs/tedlium/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH:$KALDI_ROOT/tools/sph2pipe_v2.5 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . 
$KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /src/lm/test_data/unused_backoffs.arpa: -------------------------------------------------------------------------------- 1 | 2 | \data\ 3 | ngram 1=4 4 | ngram 2=2 5 | ngram 3=2 6 | ngram 4=2 7 | 8 | \1-grams: 9 | -5.234679 a -3.3 10 | -3.456783 b 11 | 0.0000000 -2.5 12 | -4.333333 13 | 14 | \2-grams: 15 | -1.45678 a b -3.23 16 | -1.30490 a -4.2 17 | 18 | \3-grams: 19 | -0.34958 a b 20 | -0.23940 a b 21 | 22 | \4-grams: 23 | -0.01888 a b b 24 | -0.03333 b b b 25 | 26 | \end\ 27 | -------------------------------------------------------------------------------- /egs/librispeech/README.txt: -------------------------------------------------------------------------------- 1 | 2 | The LibriSpeech corpus is a large (1000 hour) corpus of English read speech 3 | derived from audiobooks in the LibriVox project, sampled at 16kHz. The 4 | accents are various and not marked, but the majority are US English. It is 5 | available for download for free at http://www.openslr.org/12/. It was prepared 6 | as a speech recognition corpus by Vassil Panayotov. 7 | 8 | The recipe is in s5/ 9 | 10 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH:$KALDI_ROOT/tools/sph2pipe_v2.5 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . 
$KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/babel/s5d/local/make_wordlist.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | echo "$0 $@" # Print the command line for logging 4 | 5 | [ -f ./path.sh ] && . ./path.sh; # source the path. 6 | . parse_options.sh || exit 1; 7 | 8 | transcriptions=$1 9 | wordlist=$2 10 | 11 | ( 12 | find $transcriptions -name "*.txt" | xargs egrep -vx '\[[0-9.]+\]' |cut -f 2- -d ':' | sed 's/ /\n/g' 13 | ) | sort -u | grep -v -E '.*\*.*|<.*>|\(\(\)\)|^-.*|.*-$' > $wordlist 14 | 15 | -------------------------------------------------------------------------------- /egs/csj/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | --window-type=hamming # disable Dans window, use the standard 2 | --sample-frequency=16000 3 | --use-energy=false # only fbank outputs 4 | 5 | --low-freq=64 # typical setup from Frantisek Grezl 6 | --high-freq=8000 7 | --dither=1 8 | 9 | --num-mel-bins=40 # 16kHz so we use 40 bins (@ 8 filters/octave to get closer to 40 filters/16Khz used by IBM) 10 | #--htk-compat=true # try to make it compatible with HTK -------------------------------------------------------------------------------- /egs/mini_librispeech/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 3 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 4 | . 
$KALDI_ROOT/tools/config/common_path.sh 5 | export LC_ALL=C 6 | 7 | # For now, don't include any of the optional dependencies of the main 8 | # librispeech recipe 9 | -------------------------------------------------------------------------------- /egs/vystadial_cz/online_demo/run_live-demo.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | # source the settings 4 | . path.sh 5 | 6 | batch_size=4560 7 | beam=12.0 8 | latbeam=6.0 9 | max_active=2000 10 | 11 | # cgdb -q -x .gdbinit_faster --args python \ 12 | python \ 13 | live-demo.py $batch_size $WST \ 14 | --verbose=0 --lat-lm-scale=15 --config=$MFCC \ 15 | --beam=$beam --lattice-beam=$latbeam --max-active=$max_active \ 16 | $AM $HCLG `cat $SILENCE` $MAT 17 | -------------------------------------------------------------------------------- /egs/yesno/README.txt: -------------------------------------------------------------------------------- 1 | 2 | 3 | The "yesno" corpus is a very small dataset of recordings of one individual 4 | saying yes or no multiple times per recording, in Hebrew. It is available from 5 | http://www.openslr.org/1. 6 | It is mainly included here as an easy way to test out the Kaldi scripts. 7 | 8 | The test set is perfectly recognized at the monophone stage, so the dataset is 9 | not exactly challenging. 10 | 11 | The scripts are in s5/. 12 | 13 | -------------------------------------------------------------------------------- /egs/librispeech/s5/local/run_nnet2_clean_100.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | . utils/parse_options.sh 4 | . ./cmd.sh 5 | 6 | # This shows what you can potentially run; you'd probably want to pick and choose. 7 | 8 | use_gpu=true 9 | 10 | if $use_gpu; then 11 | local/nnet2/run_5c_clean_100.sh --use-gpu true # this is on top of fMLLR features. 
12 | else 13 | local/nnet2/run_5c_clean_100.sh --use-gpu false # this is on top of fMLLR features. 14 | fi 15 | 16 | -------------------------------------------------------------------------------- /egs/librispeech/s5/local/run_nnet2_clean_460.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | . utils/parse_options.sh 4 | . ./cmd.sh 5 | 6 | # This shows what you can potentially run; you'd probably want to pick and choose. 7 | 8 | use_gpu=true 9 | 10 | if $use_gpu; then 11 | local/nnet2/run_5c_clean_460.sh --use-gpu true # this is on top of fMLLR features. 12 | else 13 | local/nnet2/run_5c_clean_460.sh --use-gpu false # this is on top of fMLLR features. 14 | fi 15 | 16 | -------------------------------------------------------------------------------- /egs/aurora4/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | # No non-default options for now. 2 | --window-type=hamming # disable Dans window, use the standard 3 | --use-energy=false # only fbank outputs 4 | --sample-frequency=16000 # audio is sampled at 16kHz 5 | 6 | --low-freq=64 # typical setup from Frantisek Grezl 7 | --high-freq=8000 8 | --dither=1 9 | 10 | --num-mel-bins=40 # 16kHz so we use 40 bins 11 | --htk-compat=true # try to make it compatible with HTK 12 | -------------------------------------------------------------------------------- /egs/chime2/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | # No non-default options for now. 
2 | --window-type=hamming # disable Dans window, use the standard 3 | --use-energy=false # only fbank outputs 4 | --sample-frequency=16000 # audio is sampled at 16kHz 5 | 6 | --low-freq=64 # typical setup from Frantisek Grezl 7 | --high-freq=8000 8 | --dither=1 9 | 10 | --num-mel-bins=40 # 16kHz so we use 40 bins 11 | --htk-compat=true # try to make it compatible with HTK 12 | -------------------------------------------------------------------------------- /egs/chime3/s5/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | # No non-default options for now. 2 | --window-type=hamming # disable Dans window, use the standard 3 | --use-energy=false # only fbank outputs 4 | --sample-frequency=16000 # audio is sampled at 16kHz 5 | 6 | --low-freq=64 # typical setup from Frantisek Grezl 7 | --high-freq=8000 8 | --dither=1 9 | 10 | --num-mel-bins=40 # 16kHz so we use 40 bins 11 | --htk-compat=true # try to make it compatible with HTK 12 | -------------------------------------------------------------------------------- /egs/chime3/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$KALDI_ROOT/tools/irstlm/bin/:$KALDI_ROOT/tools/kaldi_lm/:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . 
$KALDI_ROOT/tools/config/common_path.sh 6 | export LC_ALL=C 7 | -------------------------------------------------------------------------------- /egs/yesno/s5/local/prepare_dict.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | mkdir -p data/local/dict 4 | 5 | cp input/lexicon_nosil.txt data/local/dict/lexicon_words.txt 6 | 7 | cp input/lexicon.txt data/local/dict/lexicon.txt 8 | 9 | cat input/phones.txt | grep -v SIL > data/local/dict/nonsilence_phones.txt 10 | 11 | echo "SIL" > data/local/dict/silence_phones.txt 12 | 13 | echo "SIL" > data/local/dict/optional_silence.txt 14 | 15 | echo "Dictionary preparation succeeded" 16 | -------------------------------------------------------------------------------- /tools/extras/mikolov_rnnlm.patch: -------------------------------------------------------------------------------- 1 | --- rnnlmlib.h 2015-10-14 17:57:52.315280379 -0400 2 | +++ rnnlmlib.h 2015-10-14 17:58:03.723969289 -0400 3 | @@ -9,7 +9,7 @@ 4 | #ifndef _RNNLMLIB_H_ 5 | #define _RNNLMLIB_H_ 6 | 7 | -#define MAX_STRING 100 8 | +#define MAX_STRING 300 9 | 10 | typedef double real; // doubles for NN weights 11 | typedef double direct_t; // doubles for ME weights; TODO: check why floats are not enough for RNNME (convergence problems) 12 | -------------------------------------------------------------------------------- /egs/babel/s5/local/dict/reverse_dict.pl: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env perl 2 | 3 | # Used in conjunction with get_rules.pl 4 | # example input line: XANTHE Z AE1 N DH 5 | # example output line: EHTNAX DH N AE1 Z 6 | 7 | while(<>){ 8 | @A = split(" ", $_); 9 | $word = shift @A; 10 | $word = join("", reverse(split("", $word))); # Reverse letters of word. 11 | @A = reverse(@A); # Reverse phones in pron. 12 | unshift @A, $word; 13 | print join(" ", @A) . 
"\n"; 14 | } 15 | -------------------------------------------------------------------------------- /egs/babel/s5d/RUN_UNICODE_SYSTEM: -------------------------------------------------------------------------------- 1 | ./run-1-main-unicode.sh --unicode-lexicon true --morfessor true --tri5-only true 2 | 3 | # For tri5 4 | ./run-4-anydecode.sh --fast-path false --tri5-only true --skip-kws true (for tri5 only) 5 | 6 | # For lstm 7 | ./run-4-anydecode.sh --fast-path false --tri5-only true --skip-kws true --data-only true 8 | ./local/nnet3/run_lstm.sh 9 | ./run-4-anydecode.sh --nnet3-model nnet3/lstm_sp --is-rnn true --dir dev10h.pem --skip-kws true 10 | -------------------------------------------------------------------------------- /egs/chime4/s5_1ch/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | # No non-default options for now. 2 | --window-type=hamming # disable Dans window, use the standard 3 | --use-energy=false # only fbank outputs 4 | --sample-frequency=16000 # Cantonese is sampled at 8kHz 5 | 6 | --low-freq=64 # typical setup from Frantisek Grezl 7 | --high-freq=8000 8 | --dither=1 9 | 10 | --num-mel-bins=40 # 8kHz so we use 15 bins 11 | --htk-compat=true # try to make it compatible with HTK 12 | -------------------------------------------------------------------------------- /egs/chime4/s5_2ch/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | # No non-default options for now. 
2 | --window-type=hamming # disable Dan's window, use the standard 3 | --use-energy=false # only fbank outputs 4 | --sample-frequency=16000 # expected sampling rate of the input audio (16kHz) 5 | 6 | --low-freq=64 # typical setup from Frantisek Grezl 7 | --high-freq=8000 8 | --dither=1 9 | 10 | --num-mel-bins=40 # number of mel filterbank bins 11 | --htk-compat=true # try to make it compatible with HTK 12 | -------------------------------------------------------------------------------- /egs/chime4/s5_6ch/conf/fbank.conf: -------------------------------------------------------------------------------- 1 | # Fbank feature-extraction options. 2 | --window-type=hamming # disable Dan's window, use the standard 3 | --use-energy=false # only fbank outputs 4 | --sample-frequency=16000 # expected sampling rate of the input audio (16kHz) 5 | 6 | --low-freq=64 # typical setup from Frantisek Grezl 7 | --high-freq=8000 8 | --dither=1 9 | 10 | --num-mel-bins=40 # number of mel filterbank bins 11 | --htk-compat=true # try to make it compatible with HTK 12 | -------------------------------------------------------------------------------- /egs/farsdat/s5/conf/dev_spk.list: -------------------------------------------------------------------------------- 1 | 009 2 | 018 3 | 036 4 | 046 5 | 049 6 | 063 7 | 080 8 | 098 9 | 103 10 | 113 11 | 115 12 | 118 13 | 135 14 | 144 15 | 149 16 | 150 17 | 159 18 | 162 19 | 168 20 | 169 21 | 190 22 | 206 23 | 209 24 | 214 25 | 222 26 | 226 27 | 239 28 | 254 29 | 255 30 | 259 31 | 263 32 | 270 33 | 271 34 | 272 35 | 276 36 | 277 37 | 278 38 | 281 39 | 282 40 | 284 41 | 285 42 | 286 43 | 287 44 | 289 45 | 290 46 | 291 47 | 292 48 | 294 49 | 296 50 | 299 51 | -------------------------------------------------------------------------------- /egs/gale_arabic/s5/local/test_list: -------------------------------------------------------------------------------- 1 | ALAM_WITHEVENT_ARB_20070116_205800 2 | ALAM_WITHEVENT_ARB_20070130_205800 3 | ALAM_WITHEVENT_ARB_20070206_205801 4 | ALAM_WITHEVENT_ARB_20070213_205800 5
| ALAM_WITHEVENT_ARB_20070227_205800 6 | ALAM_WITHEVENT_ARB_20070306_205800 7 | ALAM_WITHEVENT_ARB_20070313_205800 8 | ARABIYA_FROMIRAQ_ARB_20070216_175800 9 | ARABIYA_FROMIRAQ_ARB_20070223_175801 10 | ARABIYA_FROMIRAQ_ARB_20070302_175801 11 | ARABIYA_FROMIRAQ_ARB_20070309_175800 12 | -------------------------------------------------------------------------------- /egs/wsj/s5/local/dict/reverse_dict.pl: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env perl 2 | 3 | # Used in conjunction with get_rules.pl 4 | # example input line: XANTHE Z AE1 N DH 5 | # example output line: EHTNAX DH N AE1 Z 6 | 7 | while(<>){ 8 | @A = split(" ", $_); 9 | $word = shift @A; 10 | $word = join("", reverse(split("", $word))); # Reverse letters of word. 11 | @A = reverse(@A); # Reverse phones in pron. 12 | unshift @A, $word; 13 | print join(" ", @A) . "\n"; 14 | } 15 | -------------------------------------------------------------------------------- /egs/aurora4/s5/local/dict/reverse_dict.pl: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env perl 2 | 3 | # Used in conjunction with get_rules.pl 4 | # example input line: XANTHE Z AE1 N DH 5 | # example output line: EHTNAX DH N AE1 Z 6 | 7 | while(<>){ 8 | @A = split(" ", $_); 9 | $word = shift @A; 10 | $word = join("", reverse(split("", $word))); # Reverse letters of word. 11 | @A = reverse(@A); # Reverse phones in pron. 12 | unshift @A, $word; 13 | print join(" ", @A) . 
"\n"; 14 | } 15 | -------------------------------------------------------------------------------- /egs/gale_arabic/s5b/local/test_list: -------------------------------------------------------------------------------- 1 | ALAM_WITHEVENT_ARB_20070116_205800 2 | ALAM_WITHEVENT_ARB_20070130_205800 3 | ALAM_WITHEVENT_ARB_20070206_205801 4 | ALAM_WITHEVENT_ARB_20070213_205800 5 | ALAM_WITHEVENT_ARB_20070227_205800 6 | ALAM_WITHEVENT_ARB_20070306_205800 7 | ALAM_WITHEVENT_ARB_20070313_205800 8 | ARABIYA_FROMIRAQ_ARB_20070216_175800 9 | ARABIYA_FROMIRAQ_ARB_20070223_175801 10 | ARABIYA_FROMIRAQ_ARB_20070302_175801 11 | ARABIYA_FROMIRAQ_ARB_20070309_175800 12 | -------------------------------------------------------------------------------- /egs/sprakbanken/s5/local/dict/reverse_dict.pl: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env perl 2 | 3 | # Used in conjunction with get_rules.pl 4 | # example input line: XANTHE Z AE1 N DH 5 | # example output line: EHTNAX DH N AE1 Z 6 | 7 | while(<>){ 8 | @A = split(" ", $_); 9 | $word = shift @A; 10 | $word = join("", reverse(split("", $word))); # Reverse letters of word. 11 | @A = reverse(@A); # Reverse phones in pron. 12 | unshift @A, $word; 13 | print join(" ", @A) . 
"\n"; 14 | } 15 | -------------------------------------------------------------------------------- /src/hmm/Makefile: -------------------------------------------------------------------------------- 1 | all: 2 | 3 | 4 | include ../kaldi.mk 5 | 6 | TESTFILES = hmm-topology-test hmm-utils-test transition-model-test posterior-test 7 | 8 | OBJFILES = hmm-topology.o transition-model.o hmm-utils.o tree-accu.o \ 9 | posterior.o hmm-test-utils.o 10 | 11 | LIBNAME = kaldi-hmm 12 | ADDLIBS = ../tree/kaldi-tree.a ../util/kaldi-util.a \ 13 | ../matrix/kaldi-matrix.a ../base/kaldi-base.a 14 | 15 | include ../makefiles/default_rules.mk 16 | 17 | -------------------------------------------------------------------------------- /egs/chime1/s5/conf/queue_usfd.conf: -------------------------------------------------------------------------------- 1 | command qsub -v PATH -j y 2 | option mem=* -l mem=$0,rmem=$0 3 | option mem=0 # Do not add anything to qsub_opts 4 | option rmem=* -l rmem=$0 5 | option rmem=0 # Do not add anything to qsub_opts 6 | option num_threads=* -pe openmp $0 7 | option num_threads=1 # Do not add anything to qsub_opts 8 | option max_jobs_run=* -tc $0 9 | option time=* -l h_rt=$0 10 | default gpu=0 11 | option gpu=0 12 | option gpu=* -l gpu=$0 -P gpu 13 | 14 | -------------------------------------------------------------------------------- /egs/swbd/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | #export KALDI_ROOT=/home/dpovey/kaldi-trunk-test 4 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 5 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 6 | . 
$KALDI_ROOT/tools/config/common_path.sh 7 | export LC_ALL=C 8 | export MKL_NUM_THREADS=16 9 | -------------------------------------------------------------------------------- /egs/wsj/s5/steps/libs/nnet3/__init__.py: -------------------------------------------------------------------------------- 1 | 2 | 3 | # Copyright 2016 Johns Hopkins University (Dan Povey) 4 | # 2016 Vimal Manohar 5 | # 2016 Vijayaditya Peddinti 6 | # 2016 Yiming Wang 7 | # Apache 2.0. 8 | 9 | 10 | # This module has the python functions which facilitate the use of nnet3 toolkit 11 | # It has two sub-modules 12 | # xconfig : Library for parsing high level description of neural networks 13 | # train : Library for training scripts 14 | -------------------------------------------------------------------------------- /egs/babel/s5/conf/common_vars.sh: -------------------------------------------------------------------------------- 1 | #keyword search default 2 | glmFile=conf/glm 3 | duptime=0.5 4 | case_insensitive=false 5 | # Lexicon and Language Model parameters 6 | oovSymbol="" 7 | lexiconFlags="-oov " 8 | boost_sil=1.5 # note from Dan: I expect 1.0 might be better (equivalent to not 9 | # having the option)... should test. 10 | cer=0 11 | 12 | [ -f ./path.sh ] && . ./path.sh; # source the path. 13 | [ -f ./cmd.sh ] && . ./cmd.sh; # source train and decode cmds. 14 | -------------------------------------------------------------------------------- /egs/babel/s5b/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | . 
/export/babel/data/software/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/sph2pipe_v2.5/:$KALDI_ROOT/src/bin:$KALDI_ROOT/tools/openfst/bin:$KALDI_ROOT/src/fstbin/:$KALDI_ROOT/src/gmmbin/:$KALDI_ROOT/src/featbin/:$KALDI_ROOT/src/lmbin/:$KALDI_ROOT/src/sgmmbin/:$KALDI_ROOT/src/sgmm2bin/:$KALDI_ROOT/src/fgmmbin/:$KALDI_ROOT/src/latbin/:$KALDI_ROOT/src/nnetbin:$KALDI_ROOT/src/nnet2bin/:$KALDI_ROOT/src/kwsbin:$PWD:$PATH 4 | export LC_ALL=C 5 | -------------------------------------------------------------------------------- /egs/babel/s5c/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | . /export/babel/data/software/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/sph2pipe_v2.5/:$KALDI_ROOT/src/bin:$KALDI_ROOT/tools/openfst/bin:$KALDI_ROOT/src/fstbin/:$KALDI_ROOT/src/gmmbin/:$KALDI_ROOT/src/featbin/:$KALDI_ROOT/src/lmbin/:$KALDI_ROOT/src/sgmmbin/:$KALDI_ROOT/src/sgmm2bin/:$KALDI_ROOT/src/fgmmbin/:$KALDI_ROOT/src/latbin/:$KALDI_ROOT/src/nnetbin:$KALDI_ROOT/src/nnet2bin/:$KALDI_ROOT/src/kwsbin:$PWD:$PATH 4 | export LC_ALL=C 5 | -------------------------------------------------------------------------------- /egs/lre/README.txt: -------------------------------------------------------------------------------- 1 | This directory (lre) will contain example scripts for language identification. 2 | Development is just beginning so this recipe is incomplete. 3 | The following LDC corpora are required: 4 | 5 | SRE 2008 training set: LDC2011S05 6 | 7 | This list will be updated as scripts for system development and testing 8 | (which will require additional data sources) are created. 9 | 10 | The subdirectories "v1" and so on are different versions of the recipe. 
11 | 12 | -------------------------------------------------------------------------------- /egs/tedlium/s5/local/chain/README: -------------------------------------------------------------------------------- 1 | These are the instructions to reproduce the TEDLIUM models described in 2 | "Purely sequence-trained neural networks for ASR based on lattice-free 3 | MMI", by Povey et al. 4 | 5 | First run: 6 | 7 | ./run.sh 8 | 9 | until the end of stage 7. (local/nnet/run_dnn.sh can be skipped.) 10 | 11 | Then run: 12 | 13 | local/chain/run_tdnn.sh 14 | 15 | to see results for a generic chain model. See the script's header 16 | comments to see other options, and their results. -------------------------------------------------------------------------------- /egs/tidigits/README.txt: -------------------------------------------------------------------------------- 1 | 2 | The TIDIGITS database consists of men, women, boys and girls reading 3 | digit strings of varying lengths; these are sampled at 20 kHz. 4 | It's available from the LDC as catalog number LDC93S10. 5 | 6 | The subdirectory s5 consists of "s5-style" (i.e. new, at the current 7 | time of writing) scripts for training and testing. Note: unlike the 8 | other s5 scripts we don't include word-boundary information, since it 9 | wouldn't add anything useful. 
10 | 11 | -------------------------------------------------------------------------------- /src/lm/Makefile: -------------------------------------------------------------------------------- 1 | EXTRA_CXXFLAGS = -Wno-sign-compare 2 | 3 | all: 4 | 5 | include ../kaldi.mk 6 | 7 | TESTFILES = arpa-file-parser-test arpa-lm-compiler-test 8 | 9 | OBJFILES = arpa-file-parser.o arpa-lm-compiler.o const-arpa-lm.o \ 10 | kaldi-rnnlm.o mikolov-rnnlm-lib.o 11 | 12 | LIBNAME = kaldi-lm 13 | 14 | ADDLIBS = ../fstext/kaldi-fstext.a ../util/kaldi-util.a \ 15 | ../matrix/kaldi-matrix.a \ 16 | ../base/kaldi-base.a 17 | 18 | include ../makefiles/default_rules.mk 19 | -------------------------------------------------------------------------------- /egs/ami/s5/conf/queue_jsalt.conf: -------------------------------------------------------------------------------- 1 | # Origin at : http://wiki.clsp.jhu.edu/view/Ws15_AWS_Kluster_Rules 2 | # configuration for the AWS cluster for WS'15. 3 | command qsub -v PATH -cwd -S /bin/bash -j y -l arch=*64* 4 | option mem=* -l mem_free=$0,ram_free=$0 5 | option mem=0 # Do not add anything to qsub_opts 6 | option num_threads=* -pe smp $0 7 | option num_threads=1 # Do not add anything to qsub_opts 8 | option max_jobs_run=* -tc $0 9 | default gpu=0 10 | option gpu=0 11 | option gpu=1 -q gpu.q 12 | -------------------------------------------------------------------------------- /egs/rm/s5/conf/decode_dnn.config: -------------------------------------------------------------------------------- 1 | # In RM, the optimal decode LMWT is in range 2..5, which is different from usual 10..15 2 | # (it is caused by using simple rule-based LM, instead of n-gram LM), 3 | scoring_opts="--min-lmwt 2 --max-lmwt 10" 4 | # Still, it is better to use --acwt 0.1, both for decoding and sMBR, 5 | acwt=0.1 6 | # For this small task we can afford to have large beams, 7 | beam=30.0 # beam for decoding. Was 13.0 in the scripts. 
8 | lattice_beam=18.0 # this has most effect on size of the lattices. 9 | -------------------------------------------------------------------------------- /egs/gale_mandarin/s5/local/gale_segment.py: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env python 2 | #coding:utf-8 3 | #!/usr/bin/env python 4 | import sys 5 | from mmseg import seg_txt 6 | for line in sys.stdin: 7 | blks = str.split(line) 8 | out_line = "" 9 | for i in range(0, len(blks)): 10 | if blks[i] == "[VOCALIZED-NOISE]" or blks[i] == "[NOISE]" or blks[i] == "[LAUGHTER]": 11 | out_line += " " + blks[i] 12 | continue 13 | for j in seg_txt(blks[i]): 14 | out_line += " " + j 15 | print out_line 16 | -------------------------------------------------------------------------------- /egs/csj/s5/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . $KALDI_ROOT/tools/config/common_path.sh 6 | export PATH=$PATH:/usr/local/cuda/bin 7 | export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:/usr/local/cuda/lib64:/usr/local/lib:/usr/local/lib64:/usr/local/cuda/bin/nvcc 8 | 9 | export LC_ALL=C 10 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/path.sh: -------------------------------------------------------------------------------- 1 | export KALDI_ROOT=`pwd`/../../.. 2 | [ -f $KALDI_ROOT/tools/env.sh ] && . $KALDI_ROOT/tools/env.sh 3 | export PATH=$PWD/utils/:$KALDI_ROOT/tools/openfst/bin:$PWD:$PATH:$KALDI_ROOT/tools/sph2pipe_v2.5 4 | [ ! -f $KALDI_ROOT/tools/config/common_path.sh ] && echo >&2 "The standard file $KALDI_ROOT/tools/config/common_path.sh is not present -> Exit!" && exit 1 5 | . 
$KALDI_ROOT/tools/config/common_path.sh 6 | export PATH=$PATH:/home/vmanoha1/kaldi-asr-diarization/src/segmenterbin 7 | export LC_ALL=C 8 | -------------------------------------------------------------------------------- /egs/hkust/s5/local/hkust_segment.py: -------------------------------------------------------------------------------- 1 | #!/usr/bin/env python 2 | #coding:utf-8 3 | 4 | import sys 5 | from __future__ import print_function 6 | from mmseg import seg_txt 7 | for line in sys.stdin: 8 | blks = str.split(line) 9 | out_line = blks[0] 10 | for i in range(1, len(blks)): 11 | if blks[i] == "[VOCALIZED-NOISE]" or blks[i] == "[NOISE]" or blks[i] == "[LAUGHTER]": 12 | out_line += " " + blks[i] 13 | continue 14 | for j in seg_txt(blks[i]): 15 | out_line += " " + j 16 | print(out_line) 17 | -------------------------------------------------------------------------------- /egs/sprakbanken/s5/local/generate_results_file.sh: -------------------------------------------------------------------------------- 1 | 2 | echo "GMM-based systems" 3 | for x in exp/*/decode*;do 4 | [ -d $x ] && grep WER $x/wer_* | utils/best_wer.sh; 5 | done 6 | 7 | echo "nnet3 xent systems" 8 | for x in exp/nnet3/tdnn*/decode* exp/nnet3/lstm*/decode* ;do 9 | [ -d $x ] && grep WER $x/wer_* | utils/best_wer.sh; 10 | done 11 | 12 | echo "Nnet3 chain systems" 13 | for x in exp/chain/tdnn*/decode* exp/chain/lstm*/decode*;do 14 | [ -d $x ] && grep WER $x/wer_* | utils/best_wer.sh; 15 | done 16 | 17 | -------------------------------------------------------------------------------- /egs/an4/s5/RESULTS: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | for x in exp/*/decode*; do [ -d $x ] && [[ $x =~ "$1" ]] && grep WER $x/wer_* | utils/best_wer.sh; done 3 | exit 0 4 | 5 | %WER 10.61 [ 82 / 773, 4 ins, 10 del, 68 sub ] exp/mono/decode/wer_10_0.5 6 | %WER 10.48 [ 81 / 773, 5 ins, 7 del, 69 sub ] exp/tri1/decode/wer_19_0.5 7 | %WER 11.38 [ 88 / 773, 17 
ins, 3 del, 68 sub ] exp/tri2/decode/wer_18_0.5 8 | %WER 5.95 [ 46 / 773, 3 ins, 3 del, 40 sub ] exp/tri3/decode/wer_20_1.0 9 | %WER 9.06 [ 70 / 773, 6 ins, 4 del, 60 sub ] exp/tri3/decode.si/wer_20_1.0 10 | -------------------------------------------------------------------------------- /egs/ami/s5/conf/queue_no_k20.conf: -------------------------------------------------------------------------------- 1 | # Default configuration 2 | command qsub -v PATH -cwd -S /bin/bash -j y -l arch=*64* 3 | option mem=* -l mem_free=$0,ram_free=$0 4 | option mem=0 # Do not add anything to qsub_opts 5 | option num_threads=* -pe smp $0 6 | option num_threads=1 # Do not add anything to qsub_opts 7 | option max_jobs_run=* -tc $0 8 | default gpu=0 9 | option gpu=0 -q all.q 10 | option gpu=* -l gpu=$0 -q g.q 11 | default allow_k20=true 12 | option allow_k20=true 13 | option allow_k20=false -l 'hostname=!g01*&!g02*&!b06*' 14 | -------------------------------------------------------------------------------- /egs/tedlium/s5/conf/no_k20.conf: -------------------------------------------------------------------------------- 1 | # Default configuration 2 | command qsub -v PATH -cwd -S /bin/bash -j y -l arch=*64* 3 | option mem=* -l mem_free=$0,ram_free=$0 4 | option mem=0 # Do not add anything to qsub_opts 5 | option num_threads=* -pe smp $0 6 | option num_threads=1 # Do not add anything to qsub_opts 7 | option max_jobs_run=* -tc $0 8 | default gpu=0 9 | option gpu=0 -q all.q 10 | option gpu=* -l gpu=$0 -q g.q 11 | default allow_k20=true 12 | option allow_k20=true 13 | option allow_k20=false -l 'hostname=!g01*&!g02*&!b06*' 14 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2/conf/no_k20.conf: -------------------------------------------------------------------------------- 1 | # Default configuration 2 | command qsub -v PATH -cwd -S /bin/bash -j y -l arch=*64* 3 | option mem=* -l mem_free=$0,ram_free=$0 4 | option mem=0 # Do not add anything 
to qsub_opts 5 | option num_threads=* -pe smp $0 6 | option num_threads=1 # Do not add anything to qsub_opts 7 | option max_jobs_run=* -tc $0 8 | default gpu=0 9 | option gpu=0 -q all.q 10 | option gpu=* -l gpu=$0 -q g.q 11 | default allow_k20=true 12 | option allow_k20=true 13 | option allow_k20=false -l 'hostname=!g01*&!g02*&!b06*' 14 | -------------------------------------------------------------------------------- /egs/vystadial_cz/s5/local/create_sample.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | # example usage: 3 | # ./local/create_sample.sh /ha/projects/vystadial/data/asr/en/voip/ Results/vystadial-sample/ test 100 4 | # note that it supposes there are only *.wav and *.wav.trn files in the source 5 | # directory; n is the number of directory entries to copy 6 | 7 | src=$1 8 | tgt=$2 9 | typ=$3 # dev/test/train 10 | n=$4 11 | 12 | src_dir=$src/$typ 13 | tgt_dir=$tgt/$typ 14 | mkdir -p "$tgt_dir" 15 | ls "$src_dir" | head -n "$n" \ 16 | | while read -r f ; do 17 | cp "$src_dir/$f" "$tgt_dir" 18 | done 19 | -------------------------------------------------------------------------------- /egs/vystadial_en/s5/local/create_sample.sh: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | # example usage: 3 | # ./local/create_sample.sh /ha/projects/vystadial/data/asr/en/voip/ Results/vystadial-sample/ test 100 4 | # note that it supposes there are only *.wav and *.wav.trn files in the source 5 | # directory; n is the number of directory entries to copy 6 | 7 | src=$1 8 | tgt=$2 9 | typ=$3 # dev/test/train 10 | n=$4 11 | 12 | src_dir=$src/$typ 13 | tgt_dir=$tgt/$typ 14 | mkdir -p "$tgt_dir" 15 | ls "$src_dir" | head -n "$n" \ 16 | | while read -r f ; do 17 | cp "$src_dir/$f" "$tgt_dir" 18 | done 19 | -------------------------------------------------------------------------------- /egs/aspire/s5/conf/queue_no_k20.conf: -------------------------------------------------------------------------------- 1 | # Default configuration 2 |
command qsub -v PATH -cwd -S /bin/bash -j y -l arch=*64* 3 | option mem=* -l mem_free=$0,ram_free=$0 4 | option mem=0 # Do not add anything to qsub_opts 5 | option num_threads=* -pe smp $0 6 | option num_threads=1 # Do not add anything to qsub_opts 7 | option max_jobs_run=* -tc $0 8 | default gpu=0 9 | option gpu=0 -q all.q 10 | option gpu=* -l gpu=$0 -q g.q 11 | default allow_k20=true 12 | option allow_k20=true 13 | option allow_k20=false -l 'hostname=!g01*&!g02*&!b06*' 14 | -------------------------------------------------------------------------------- /egs/tedlium/s5_r2_wsj/conf/no_k20.conf: -------------------------------------------------------------------------------- 1 | # Default configuration 2 | command qsub -v PATH -cwd -S /bin/bash -j y -l arch=*64* 3 | option mem=* -l mem_free=$0,ram_free=$0 4 | option mem=0 # Do not add anything to qsub_opts 5 | option num_threads=* -pe smp $0 6 | option num_threads=1 # Do not add anything to qsub_opts 7 | option max_jobs_run=* -tc $0 8 | default gpu=0 9 | option gpu=0 -q all.q 10 | option gpu=* -l gpu=$0 -q g.q 11 | default allow_k20=true 12 | option allow_k20=true 13 | option allow_k20=false -l 'hostname=!g01*&!g02*&!b06*' 14 | -------------------------------------------------------------------------------- /egs/README.txt: -------------------------------------------------------------------------------- 1 | 2 | This directory contains example scripts that demonstrate how to 3 | use Kaldi. Each subdirectory corresponds to a corpus that we have 4 | example scripts for. 5 | 6 | Note: we now have some scripts using free data, including voxforge, 7 | vystadial_{cz,en} and yesno. Most of the others are available from 8 | the Linguistic Data Consortium (LDC), which requires money (unless you 9 | have a membership). 10 | 11 | If you have an LDC membership, probably rm/s5 or wsj/s5 should be your first 12 | choice to try out the scripts. 
13 | 14 | -------------------------------------------------------------------------------- /egs/csj/s5/local/wer_hyp_filter: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | perl -e 'foreach $w (@ARGV) { $bad{$w} = 1; } 4 | while(<STDIN>) { @A = split(" ", $_); $id = shift @A; print "$id "; 5 | foreach $a (@A) { if (!defined $bad{$a}){ @W=split(/\+/,$a); $word=$W[0]; { print "$word "; }}} print "\n"; }' \ 6 | '' '' 7 | 8 | -------------------------------------------------------------------------------- /egs/csj/s5/local/wer_ref_filter: -------------------------------------------------------------------------------- 1 | #!/bin/bash 2 | 3 | perl -e 'foreach $w (@ARGV) { $bad{$w} = 1; } 4 | while(<STDIN>) { @A = split(" ", $_); $id = shift @A; print "$id "; 5 | foreach $a (@A) { if (!defined $bad{$a}){ @W=split(/\+/,$a); $word=$W[0]; { print "$word "; }}} print "\n"; }' \ 6 | '' '' 7 | 8 | -------------------------------------------------------------------------------- /egs/gale_arabic/s5/local/bad_segments: -------------------------------------------------------------------------------- 1 | ARABIYA_FROMIRAQ_ARB_20070302_175801_2326286_2327450 2 | ARABIYA_BILARABI_ARB_20061005_201400_221375_223694 3 | LBC_NAHAR_ARB_20060911_142800_3683267_3685290 4 | LBC_NAHAR_ARB_20070303_145800_3249800_3251128 5 | LBC_NAHAR_ARB_20070303_145800_3623646_3624152 6 | LBC_NAHAR_ARB_20070305_035800_481003_484069 7 | ALAM_WITHEVENT_ARB_20070227_205800_3141876_3144152 8 | ALAM_NEWSRPT_ARB_20070130_015801_2875054_2876396 9 | ALJZ_TODHARV_ARB_20060914_155800_2947717_2949041 10 | ALJZ_TODHARV_ARB_20070107_145800_2417848_2419238 11 | -------------------------------------------------------------------------------- /egs/gale_arabic/s5b/local/bad_segments: -------------------------------------------------------------------------------- 1 | ARABIYA_FROMIRAQ_ARB_20070302_175801_2326286_2327450 2 | ARABIYA_BILARABI_ARB_20061005_201400_221375_223694 3 |
LBC_NAHAR_ARB_20060911_142800_3683267_3685290 4 | LBC_NAHAR_ARB_20070303_145800_3249800_3251128 5 | LBC_NAHAR_ARB_20070303_145800_3623646_3624152 6 | LBC_NAHAR_ARB_20070305_035800_481003_484069 7 | ALAM_WITHEVENT_ARB_20070227_205800_3141876_3144152 8 | ALAM_NEWSRPT_ARB_20070130_015801_2875054_2876396 9 | ALJZ_TODHARV_ARB_20060914_155800_2947717_2949041 10 | ALJZ_TODHARV_ARB_20070107_145800_2417848_2419238 11 | --------------------------------------------------------------------------------