├── .gitignore ├── LICENSE ├── README.md ├── careless_whisper_stream ├── __init__.py ├── __main__.py ├── assets │ ├── gpt2.tiktoken │ ├── mel_filters.npz │ └── multilingual.tiktoken ├── audio.py ├── decoding.py ├── model.py ├── normalizers │ ├── __init__.py │ ├── basic.py │ ├── english.json │ └── english.py ├── streaming_decoding.py ├── streaming_model.py ├── streaming_transcribe.py ├── timing.py ├── tokenizer.py ├── transcribe.py ├── triton_ops.py ├── utils.py └── version.py ├── environment.yml ├── requirements.txt ├── tests ├── jfk.wav └── streaming_transcription.py ├── training_code ├── __init__.py ├── collators.py ├── datasets_classes.py ├── ds_dict.py ├── train.py ├── utils.py └── whisper_module.py └── transcribe.py /.gitignore: -------------------------------------------------------------------------------- 1 | *.ipynb 2 | __pycache__/ 3 | notebooks/ 4 | static/ -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/README.md -------------------------------------------------------------------------------- /careless_whisper_stream/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/__init__.py -------------------------------------------------------------------------------- /careless_whisper_stream/__main__.py: -------------------------------------------------------------------------------- 1 | from .streaming_transcribe import cli 2 | 3 | cli() 4 | -------------------------------------------------------------------------------- /careless_whisper_stream/assets/gpt2.tiktoken: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/assets/gpt2.tiktoken -------------------------------------------------------------------------------- /careless_whisper_stream/assets/mel_filters.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/assets/mel_filters.npz -------------------------------------------------------------------------------- /careless_whisper_stream/assets/multilingual.tiktoken: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/assets/multilingual.tiktoken -------------------------------------------------------------------------------- /careless_whisper_stream/audio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/audio.py -------------------------------------------------------------------------------- /careless_whisper_stream/decoding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/decoding.py -------------------------------------------------------------------------------- /careless_whisper_stream/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/model.py -------------------------------------------------------------------------------- /careless_whisper_stream/normalizers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/normalizers/__init__.py -------------------------------------------------------------------------------- /careless_whisper_stream/normalizers/basic.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/normalizers/basic.py -------------------------------------------------------------------------------- /careless_whisper_stream/normalizers/english.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/normalizers/english.json -------------------------------------------------------------------------------- /careless_whisper_stream/normalizers/english.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/normalizers/english.py -------------------------------------------------------------------------------- /careless_whisper_stream/streaming_decoding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/streaming_decoding.py -------------------------------------------------------------------------------- /careless_whisper_stream/streaming_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/streaming_model.py -------------------------------------------------------------------------------- /careless_whisper_stream/streaming_transcribe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/streaming_transcribe.py -------------------------------------------------------------------------------- /careless_whisper_stream/timing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/timing.py -------------------------------------------------------------------------------- /careless_whisper_stream/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/tokenizer.py -------------------------------------------------------------------------------- /careless_whisper_stream/transcribe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/transcribe.py -------------------------------------------------------------------------------- /careless_whisper_stream/triton_ops.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/triton_ops.py -------------------------------------------------------------------------------- /careless_whisper_stream/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/careless_whisper_stream/utils.py -------------------------------------------------------------------------------- /careless_whisper_stream/version.py: -------------------------------------------------------------------------------- 1 | __version__ = "20231117" 2 | -------------------------------------------------------------------------------- /environment.yml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/environment.yml -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/requirements.txt -------------------------------------------------------------------------------- /tests/jfk.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/tests/jfk.wav -------------------------------------------------------------------------------- /tests/streaming_transcription.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/tests/streaming_transcription.py -------------------------------------------------------------------------------- /training_code/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /training_code/collators.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/training_code/collators.py -------------------------------------------------------------------------------- /training_code/datasets_classes.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/training_code/datasets_classes.py -------------------------------------------------------------------------------- /training_code/ds_dict.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/training_code/ds_dict.py -------------------------------------------------------------------------------- /training_code/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/training_code/train.py -------------------------------------------------------------------------------- /training_code/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/training_code/utils.py -------------------------------------------------------------------------------- /training_code/whisper_module.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/training_code/whisper_module.py -------------------------------------------------------------------------------- /transcribe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/tomer9080/CarelessWhisper-Streaming/HEAD/transcribe.py --------------------------------------------------------------------------------