├── .DS_Store
├── LICENSE
├── README.md
├── checkpoints
    ├── .DS_Store
    ├── custom_model
    │   └── empty.txt
    ├── finetuning
    │   └── empty.txt
    └── pretraining
    │   └── empty.txt
├── config
    ├── README.md
    ├── finetuning
    │   ├── base_100h.yaml
    │   └── base_10h.yaml
    ├── hf
    │   └── hf_config.json
    └── pretraining
    │   └── wav2vec2_base_librispeech.yaml
├── data
    ├── .DS_Store
    ├── finetuning
    │   └── empty.txt
    ├── inference
    │   └── empty.txt
    ├── pretraining
    │   └── empty.txt
    └── processed
    │   └── empty.txt
├── lm
    └── empty.txt
├── logs
    ├── .DS_Store
    ├── finetuning
    │   └── empty.txt
    └── pretraining
    │   └── empty.txt
├── notebooks
    └── empty.txt
├── requirements.txt
├── results
    └── empty.txt
├── scripts
    ├── data
    │   └── empty.txt
    ├── finetuning
    │   ├── README.md
    │   ├── prepare_data.sh
    │   └── start_finetuning.sh
    ├── hf
    │   ├── generate_hf_model.sh
    │   └── single_file_inference.sh
    ├── inference
    │   ├── README.md
    │   ├── generate_custom_model.sh
    │   ├── infer.sh
    │   ├── prepare_data.sh
    │   └── single_file_inference.sh
    ├── lm
    │   ├── README.md
    │   └── run_lm_pipeline.sh
    ├── parse_yaml.sh
    ├── pretraining
    │   ├── README.md
    │   ├── prepare_data.sh
    │   ├── start_pretraining_base.sh
    │   └── start_pretraining_large.sh
    └── torchscript
    │   └── convert_hf.sh
├── setup_new_env.sh
├── tests
    ├── finetuning
    │   ├── README.md
    │   ├── prepare_data.sh
    │   ├── start_finetuning_new.sh
    │   └── start_finetuning_old.sh
    └── inference
    │   ├── .infer.sh.swp
    │   ├── README.md
    │   ├── generate_custom_model.sh
    │   ├── generate_eng_model.sh
    │   ├── generate_hindi_model.sh
    │   ├── infer.sh
    │   ├── infer_english.sh
    │   ├── infer_hindi.sh
    │   ├── prepare_data.sh
    │   ├── single_eng.sh
    │   ├── single_file_inference.sh
    │   └── single_hindi.sh
└── utils
    ├── analysis
        ├── generate_dict_analysis.py
        └── generate_wav_report_from_tsv.py
    ├── clean_dir
        └── clean_directories.py
    ├── hf
        ├── convert_to_hf.py
        └── single_file_inference.py
    ├── inference
        ├── generate_custom_model.py
        ├── infer.py
        ├── save_predicted_output.py
        ├── single_file_inference.py
        └── update_model.py
    ├── lm
        ├── clean_text.py
        ├── concatenate_text.py
        ├── generate_lm.py
        ├── make_lexicon_lst.py
        └── remove_duplicate_lines.py
    ├── prep_scripts
        ├── dict_and_lexicon_maker.py
        ├── labels.py
        └── manifest.py
    ├── torchscript
        └── convert_hf.py
    └── wer
        ├── components.py
        ├── wer.py
        └── wer_wav2vec.py


/.DS_Store:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/.DS_Store


--------------------------------------------------------------------------------
/LICENSE:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/LICENSE


--------------------------------------------------------------------------------
/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/README.md


--------------------------------------------------------------------------------
/checkpoints/.DS_Store:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/checkpoints/.DS_Store


--------------------------------------------------------------------------------
/checkpoints/custom_model/empty.txt:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/checkpoints/finetuning/empty.txt:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/checkpoints/pretraining/empty.txt:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/config/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/config/README.md


--------------------------------------------------------------------------------
/config/finetuning/base_100h.yaml:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/config/finetuning/base_100h.yaml


--------------------------------------------------------------------------------
/config/finetuning/base_10h.yaml:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/config/finetuning/base_10h.yaml


--------------------------------------------------------------------------------
/config/hf/hf_config.json:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/config/hf/hf_config.json


--------------------------------------------------------------------------------
/config/pretraining/wav2vec2_base_librispeech.yaml:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/config/pretraining/wav2vec2_base_librispeech.yaml


--------------------------------------------------------------------------------
/data/.DS_Store:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/data/.DS_Store


--------------------------------------------------------------------------------
/data/finetuning/empty.txt:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/data/inference/empty.txt:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/data/pretraining/empty.txt:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/data/processed/empty.txt:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/lm/empty.txt:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/logs/.DS_Store:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/logs/.DS_Store


--------------------------------------------------------------------------------
/logs/finetuning/empty.txt:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/logs/pretraining/empty.txt:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/notebooks/empty.txt:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/requirements.txt:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/requirements.txt


--------------------------------------------------------------------------------
/results/empty.txt:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/scripts/data/empty.txt:
--------------------------------------------------------------------------------
1 | 


--------------------------------------------------------------------------------
/scripts/finetuning/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/finetuning/README.md


--------------------------------------------------------------------------------
/scripts/finetuning/prepare_data.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/finetuning/prepare_data.sh


--------------------------------------------------------------------------------
/scripts/finetuning/start_finetuning.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/finetuning/start_finetuning.sh


--------------------------------------------------------------------------------
/scripts/hf/generate_hf_model.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/hf/generate_hf_model.sh


--------------------------------------------------------------------------------
/scripts/hf/single_file_inference.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/hf/single_file_inference.sh


--------------------------------------------------------------------------------
/scripts/inference/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/inference/README.md


--------------------------------------------------------------------------------
/scripts/inference/generate_custom_model.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/inference/generate_custom_model.sh


--------------------------------------------------------------------------------
/scripts/inference/infer.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/inference/infer.sh


--------------------------------------------------------------------------------
/scripts/inference/prepare_data.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/inference/prepare_data.sh


--------------------------------------------------------------------------------
/scripts/inference/single_file_inference.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/inference/single_file_inference.sh


--------------------------------------------------------------------------------
/scripts/lm/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/lm/README.md


--------------------------------------------------------------------------------
/scripts/lm/run_lm_pipeline.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/lm/run_lm_pipeline.sh


--------------------------------------------------------------------------------
/scripts/parse_yaml.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/parse_yaml.sh


--------------------------------------------------------------------------------
/scripts/pretraining/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/pretraining/README.md


--------------------------------------------------------------------------------
/scripts/pretraining/prepare_data.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/pretraining/prepare_data.sh


--------------------------------------------------------------------------------
/scripts/pretraining/start_pretraining_base.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/pretraining/start_pretraining_base.sh


--------------------------------------------------------------------------------
/scripts/pretraining/start_pretraining_large.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/pretraining/start_pretraining_large.sh


--------------------------------------------------------------------------------
/scripts/torchscript/convert_hf.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/scripts/torchscript/convert_hf.sh


--------------------------------------------------------------------------------
/setup_new_env.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/setup_new_env.sh


--------------------------------------------------------------------------------
/tests/finetuning/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/tests/finetuning/README.md


--------------------------------------------------------------------------------
/tests/finetuning/prepare_data.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/tests/finetuning/prepare_data.sh


--------------------------------------------------------------------------------
/tests/finetuning/start_finetuning_new.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/tests/finetuning/start_finetuning_new.sh


--------------------------------------------------------------------------------
/tests/finetuning/start_finetuning_old.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/tests/finetuning/start_finetuning_old.sh


--------------------------------------------------------------------------------
/tests/inference/.infer.sh.swp:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/tests/inference/.infer.sh.swp


--------------------------------------------------------------------------------
/tests/inference/README.md:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/tests/inference/README.md


--------------------------------------------------------------------------------
/tests/inference/generate_custom_model.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/tests/inference/generate_custom_model.sh


--------------------------------------------------------------------------------
/tests/inference/generate_eng_model.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/tests/inference/generate_eng_model.sh


--------------------------------------------------------------------------------
/tests/inference/generate_hindi_model.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/tests/inference/generate_hindi_model.sh


--------------------------------------------------------------------------------
/tests/inference/infer.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/tests/inference/infer.sh


--------------------------------------------------------------------------------
/tests/inference/infer_english.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/tests/inference/infer_english.sh


--------------------------------------------------------------------------------
/tests/inference/infer_hindi.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/tests/inference/infer_hindi.sh


--------------------------------------------------------------------------------
/tests/inference/prepare_data.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/tests/inference/prepare_data.sh


--------------------------------------------------------------------------------
/tests/inference/single_eng.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/tests/inference/single_eng.sh


--------------------------------------------------------------------------------
/tests/inference/single_file_inference.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/tests/inference/single_file_inference.sh


--------------------------------------------------------------------------------
/tests/inference/single_hindi.sh:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/tests/inference/single_hindi.sh


--------------------------------------------------------------------------------
/utils/analysis/generate_dict_analysis.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/analysis/generate_dict_analysis.py


--------------------------------------------------------------------------------
/utils/analysis/generate_wav_report_from_tsv.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/analysis/generate_wav_report_from_tsv.py


--------------------------------------------------------------------------------
/utils/clean_dir/clean_directories.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/clean_dir/clean_directories.py


--------------------------------------------------------------------------------
/utils/hf/convert_to_hf.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/hf/convert_to_hf.py


--------------------------------------------------------------------------------
/utils/hf/single_file_inference.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/hf/single_file_inference.py


--------------------------------------------------------------------------------
/utils/inference/generate_custom_model.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/inference/generate_custom_model.py


--------------------------------------------------------------------------------
/utils/inference/infer.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/inference/infer.py


--------------------------------------------------------------------------------
/utils/inference/save_predicted_output.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/inference/save_predicted_output.py


--------------------------------------------------------------------------------
/utils/inference/single_file_inference.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/inference/single_file_inference.py


--------------------------------------------------------------------------------
/utils/inference/update_model.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/inference/update_model.py


--------------------------------------------------------------------------------
/utils/lm/clean_text.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/lm/clean_text.py


--------------------------------------------------------------------------------
/utils/lm/concatenate_text.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/lm/concatenate_text.py


--------------------------------------------------------------------------------
/utils/lm/generate_lm.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/lm/generate_lm.py


--------------------------------------------------------------------------------
/utils/lm/make_lexicon_lst.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/lm/make_lexicon_lst.py


--------------------------------------------------------------------------------
/utils/lm/remove_duplicate_lines.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/lm/remove_duplicate_lines.py


--------------------------------------------------------------------------------
/utils/prep_scripts/dict_and_lexicon_maker.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/prep_scripts/dict_and_lexicon_maker.py


--------------------------------------------------------------------------------
/utils/prep_scripts/labels.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/prep_scripts/labels.py


--------------------------------------------------------------------------------
/utils/prep_scripts/manifest.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/prep_scripts/manifest.py


--------------------------------------------------------------------------------
/utils/torchscript/convert_hf.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/torchscript/convert_hf.py


--------------------------------------------------------------------------------
/utils/wer/components.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/wer/components.py


--------------------------------------------------------------------------------
/utils/wer/wer.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/wer/wer.py


--------------------------------------------------------------------------------
/utils/wer/wer_wav2vec.py:
--------------------------------------------------------------------------------
https://raw.githubusercontent.com/Open-Speech-EkStep/vakyansh-wav2vec2-experimentation/HEAD/utils/wer/wer_wav2vec.py


--------------------------------------------------------------------------------