summary | refs | log | tree | commit | diff | stats
path: root/transcribe.py
diff options
context:
space:
mode:
author yum <yum.food.vr@gmail.com> 2022-11-10 21:21:07 -0800
committer yum <yum.food.vr@gmail.com> 2022-11-10 21:21:07 -0800
commit 772b44806a5f5da11cca74c99b59c3cf7d5ceae5 (patch)
tree aba2f690b4be58aaa4c0c0f26443ba5085deca63 /transcribe.py
parent 2efc87a7180ec6e92127d22d1a3eb8c44fd392db (diff)
License scrub
Begin auditing dependencies' licenses.
Diffstat (limited to 'transcribe.py')
-rw-r--r-- transcribe.py 35
1 files changed, 21 insertions, 14 deletions
diff --git a/transcribe.py b/transcribe.py
index e96d794..2e4457e 100644
--- a/transcribe.py
+++ b/transcribe.py
@@ -6,9 +6,11 @@ import string_matcher
import os
import osc_ctrl
# python3 -m pip install pydub
+# License: MIT.
from pydub import AudioSegment as pydub_AudioSegment
from pydub import effects as pydub_effects
# python3 -m pip install pyaudio
+# License: MIT.
import pyaudio
import sys
import threading
@@ -16,6 +18,7 @@ import time
import wave
# python3 -m pip install git+https://github.com/openai/whisper.git
# python3 -m pip install torch -f https://download.pytorch.org/whl/torch_stable.html
+# License: MIT.
import whisper
class AudioState:
@@ -270,20 +273,9 @@ def sendAudio(audio_state):
# Pace this out
time.sleep(0.01)
-if __name__ == "__main__":
- parser = argparse.ArgumentParser()
- parser.add_argument("--mic", type=str, help="Which mic to use. Options: index, focusrite. Default: index")
- parser.add_argument("--language", type=str, help="Which language to use. Ex: english, japanese, chinese, french, german.")
- args = parser.parse_args()
-
- if not args.mic:
- args.mic = "index"
-
- if not args.language:
- args.language = "english"
-
- audio_state = getMicStream(args.mic)
- audio_state.language = whisper.tokenizer.TO_LANGUAGE_CODE[args.language]
+def transcribeLoop(mic: str, language: str):
+ audio_state = getMicStream(mic)
+ audio_state.language = whisper.tokenizer.TO_LANGUAGE_CODE[language]
if os.path.isfile(audio_state.VOICE_AUDIO_FILENAME):
# empty out the voice file
@@ -318,3 +310,18 @@ if __name__ == "__main__":
record_audio_thd.join()
transcribe_audio_thd.join()
+
+if __name__ == "__main__":
+ parser = argparse.ArgumentParser()
+ parser.add_argument("--mic", type=str, help="Which mic to use. Options: index, focusrite. Default: index")
+ parser.add_argument("--language", type=str, help="Which language to use. Ex: english, japanese, chinese, french, german.")
+ args = parser.parse_args()
+
+ if not args.mic:
+ args.mic = "index"
+
+ if not args.language:
+ args.language = "english"
+
+ transcribeLoop(args.mic, args.language)
+