diff options
| author | yum <yum.food.vr@gmail.com> | 2022-11-10 21:21:07 -0800 |
|---|---|---|
| committer | yum <yum.food.vr@gmail.com> | 2022-11-10 21:21:07 -0800 |
| commit | 772b44806a5f5da11cca74c99b59c3cf7d5ceae5 (patch) | |
| tree | aba2f690b4be58aaa4c0c0f26443ba5085deca63 /transcribe.py | |
| parent | 2efc87a7180ec6e92127d22d1a3eb8c44fd392db (diff) | |
License scrub
Begin auditing dependencies' licenses.
Diffstat (limited to 'transcribe.py')
| -rw-r--r-- | transcribe.py | 35 |
1 files changed, 21 insertions, 14 deletions
```diff
diff --git a/transcribe.py b/transcribe.py
index e96d794..2e4457e 100644
--- a/transcribe.py
+++ b/transcribe.py
@@ -6,9 +6,11 @@ import string_matcher
 import os
 import osc_ctrl
 # python3 -m pip install pydub
+# License: MIT.
 from pydub import AudioSegment as pydub_AudioSegment
 from pydub import effects as pydub_effects
 # python3 -m pip install pyaudio
+# License: MIT.
 import pyaudio
 import sys
 import threading
@@ -16,6 +18,7 @@ import time
 import wave
 # python3 -m pip install git+https://github.com/openai/whisper.git
 # python3 -m pip install torch -f https://download.pytorch.org/whl/torch_stable.html
+# License: MIT.
 import whisper
 
 class AudioState:
@@ -270,20 +273,9 @@ def sendAudio(audio_state):
         # Pace this out
         time.sleep(0.01)
 
-if __name__ == "__main__":
-    parser = argparse.ArgumentParser()
-    parser.add_argument("--mic", type=str, help="Which mic to use. Options: index, focusrite. Default: index")
-    parser.add_argument("--language", type=str, help="Which language to use. Ex: english, japanese, chinese, french, german.")
-    args = parser.parse_args()
-
-    if not args.mic:
-        args.mic = "index"
-
-    if not args.language:
-        args.language = "english"
-
-    audio_state = getMicStream(args.mic)
-    audio_state.language = whisper.tokenizer.TO_LANGUAGE_CODE[args.language]
+def transcribeLoop(mic: str, language: str):
+    audio_state = getMicStream(mic)
+    audio_state.language = whisper.tokenizer.TO_LANGUAGE_CODE[language]
 
     if os.path.isfile(audio_state.VOICE_AUDIO_FILENAME):
         # empty out the voice file
@@ -318,3 +310,18 @@ if __name__ == "__main__":
 
     record_audio_thd.join()
     transcribe_audio_thd.join()
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser()
+    parser.add_argument("--mic", type=str, help="Which mic to use. Options: index, focusrite. Default: index")
+    parser.add_argument("--language", type=str, help="Which language to use. Ex: english, japanese, chinese, french, german.")
+    args = parser.parse_args()
+
+    if not args.mic:
+        args.mic = "index"
+
+    if not args.language:
+        args.language = "english"
+
+    transcribeLoop(args.mic, args.language)
+
```
