├── .gitignore ├── CITATION.cff ├── LICENSE ├── README.md ├── evaluation.md ├── images ├── ASR-Comparison-2021.png ├── ASR-Comparison-2022.png └── ASR-Comparison.png └── src ├── chart ├── comparison.js └── index.html ├── datasets ├── common_voice │ ├── README.md │ └── common_voice.py ├── magic_data │ └── magic_data.py ├── magic_data_conversation │ └── magic_data_conversation.py └── titml │ └── titml.py ├── id.json ├── jv.json ├── jv_su.json ├── jv_su_id.json ├── jv_su_id_500.json ├── jv_su_id_all.json ├── run_evaluation.py ├── run_evaluation_google.py ├── run_finetuning.py ├── run_finetuning_id.sh ├── run_finetuning_jv.sh ├── run_finetuning_jv_su.sh ├── run_finetuning_jv_su_id.sh ├── run_finetuning_jv_su_id_all.sh ├── run_finetuning_su.sh ├── su.json ├── tools └── magic_data_conversion.py ├── transcription_google.tsv └── util ├── currency.tsv ├── measurements.tsv ├── text_processor.py └── timezones.tsv /.gitignore: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/.gitignore -------------------------------------------------------------------------------- /CITATION.cff: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/CITATION.cff -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/README.md -------------------------------------------------------------------------------- /evaluation.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/evaluation.md -------------------------------------------------------------------------------- /images/ASR-Comparison-2021.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/images/ASR-Comparison-2021.png -------------------------------------------------------------------------------- /images/ASR-Comparison-2022.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/images/ASR-Comparison-2022.png -------------------------------------------------------------------------------- /images/ASR-Comparison.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/images/ASR-Comparison.png -------------------------------------------------------------------------------- /src/chart/comparison.js: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/chart/comparison.js -------------------------------------------------------------------------------- /src/chart/index.html: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/chart/index.html -------------------------------------------------------------------------------- /src/datasets/common_voice/README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/datasets/common_voice/README.md -------------------------------------------------------------------------------- /src/datasets/common_voice/common_voice.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/datasets/common_voice/common_voice.py -------------------------------------------------------------------------------- /src/datasets/magic_data/magic_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/datasets/magic_data/magic_data.py -------------------------------------------------------------------------------- /src/datasets/magic_data_conversation/magic_data_conversation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/datasets/magic_data_conversation/magic_data_conversation.py -------------------------------------------------------------------------------- /src/datasets/titml/titml.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/datasets/titml/titml.py -------------------------------------------------------------------------------- /src/id.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/id.json -------------------------------------------------------------------------------- /src/jv.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/jv.json -------------------------------------------------------------------------------- /src/jv_su.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/jv_su.json -------------------------------------------------------------------------------- /src/jv_su_id.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/jv_su_id.json -------------------------------------------------------------------------------- /src/jv_su_id_500.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/jv_su_id_500.json -------------------------------------------------------------------------------- /src/jv_su_id_all.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/jv_su_id_all.json -------------------------------------------------------------------------------- /src/run_evaluation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/run_evaluation.py -------------------------------------------------------------------------------- /src/run_evaluation_google.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/run_evaluation_google.py -------------------------------------------------------------------------------- /src/run_finetuning.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/run_finetuning.py -------------------------------------------------------------------------------- /src/run_finetuning_id.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/run_finetuning_id.sh -------------------------------------------------------------------------------- /src/run_finetuning_jv.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/run_finetuning_jv.sh -------------------------------------------------------------------------------- /src/run_finetuning_jv_su.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/run_finetuning_jv_su.sh -------------------------------------------------------------------------------- /src/run_finetuning_jv_su_id.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/run_finetuning_jv_su_id.sh -------------------------------------------------------------------------------- /src/run_finetuning_jv_su_id_all.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/run_finetuning_jv_su_id_all.sh -------------------------------------------------------------------------------- /src/run_finetuning_su.sh: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/run_finetuning_su.sh -------------------------------------------------------------------------------- /src/su.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/su.json -------------------------------------------------------------------------------- /src/tools/magic_data_conversion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/tools/magic_data_conversion.py -------------------------------------------------------------------------------- /src/transcription_google.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/transcription_google.tsv -------------------------------------------------------------------------------- /src/util/currency.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/util/currency.tsv -------------------------------------------------------------------------------- /src/util/measurements.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/util/measurements.tsv -------------------------------------------------------------------------------- /src/util/text_processor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/util/text_processor.py -------------------------------------------------------------------------------- /src/util/timezones.tsv: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/indonesian-nlp/multilingual-asr/HEAD/src/util/timezones.tsv --------------------------------------------------------------------------------