Shorten audio window to 10 seconds

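This improves temporal stability in long-running transcriptions and lets us remove the hack where we refuse to update old pages. The recording buffer is now capped at 10 seconds (MAX_LENGTH_S), while the audio handed to Whisper is still padded or trimmed to 30 seconds (MAX_LENGTH_S_WHISPER).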
author: yum <yum.food.vr@gmail.com> 2022-11-22 19:01:01 -0800
committer: yum <yum.food.vr@gmail.com> 2022-11-22 19:01:01 -0800
commit: 9f87674d1b484a2e61e87ad53d8ebcf9985dce6b (patch)
tree: b3e8958a5a28901f1ecb9409db22ba15dba00a77 /transcribe.py
parent: a7a52b884061b154eaae6b0a8c0d5b443cbb8abe (diff)
1 file changed, 3 insertions, 2 deletions
diff --git a/transcribe.py b/transcribe.py
index 91fcd54..b316014 100644
--- a/transcribe.py
+++ b/transcribe.py
@@ -33,7 +33,8 @@ class AudioState:
 
     # The maximum length that recordAudio() will put into frames before it
     # starts dropping from the start.
-    MAX_LENGTH_S = 30
+    MAX_LENGTH_S = 10
+    MAX_LENGTH_S_WHISPER = 30
     # The minimum length that recordAudio() will wait for before saving audio.
     MIN_LENGTH_S = 1
 
@@ -202,7 +203,7 @@ def transcribe(audio_state, model, filename):
     audio_state.transcribe_lock.release()
 
     audio = whisper.pad_or_trim(audio, length = audio_state.RATE *
-            audio_state.MAX_LENGTH_S)
+            audio_state.MAX_LENGTH_S_WHISPER)
     mel = whisper.log_mel_spectrogram(audio).to(model.device)
 
     result = None
author	yum <yum.food.vr@gmail.com>	2022-11-22 19:01:01 -0800
committer	yum <yum.food.vr@gmail.com>	2022-11-22 19:01:01 -0800
commit	9f87674d1b484a2e61e87ad53d8ebcf9985dce6b (patch)
tree	b3e8958a5a28901f1ecb9409db22ba15dba00a77 /transcribe.py
parent	a7a52b884061b154eaae6b0a8c0d5b443cbb8abe (diff)