Tweak transcription heuristics

The heuristics now occur in the filtered word space, so punctuation and casing changes won't confound them.
author: yum <yum.food.vr@gmail.com> 2022-10-25 16:31:20 -0700
committer: yum <yum.food.vr@gmail.com> 2022-10-25 16:31:20 -0700
commit: f84d83b611b751d20c9b7b983c4a90e389117a6b (patch)
tree: c2d1400f2ce688b336a6e39967a7853e15500eca /transcribe.py
parent: 98284cc0ca42c75ef8cf22d9435821c62a12c592 (diff)
1 files changed, 13 insertions, 3 deletions
diff --git a/transcribe.py b/transcribe.py
index 520d63e..99429c6 100644
--- a/transcribe.py
+++ b/transcribe.py
@@ -231,11 +231,21 @@ def transcribeAudio(audio_state, model):
         #   3. If the transcription is somewhat long and the
         #       first few characters change, we assume this is due to a
         #       trim event and immediately accept the transcription.
+        candidate_words = ''.join(c for c in audio_state.text_candidate.lower() if (c.isalpha() or c == " ")).split()
+
+        candidate_words_are_prefix_of_text = False
+        if len(candidate_words) < len(words) and \
+                candidate_words == words[0:len(candidate_words)]:
+            candidate_words_are_prefix_of_text = True
+
         commit_transcription = False
-        if text == audio_state.text_candidate or text.startswith(audio_state.text_candidate):
-            commit_transcription = True
-        elif len(text) > 30 and len(audio_state.text_candidate) >= 10 and text[0:10] != audio_state.text_candidate[0:10]:
+        if words == candidate_words or candidate_words_are_prefix_of_text:
             commit_transcription = True
+        elif len(text) > 30 and len(audio_state.text_candidate) >= 10:
+            d = levenshtein_distance(text[0:10],
+                    audio_state.text_candidate[0:10])
+            if d > 2:
+                commit_transcription = True
 
         print("Transcription: {}".format(audio_state.text))
author	yum <yum.food.vr@gmail.com>	2022-10-25 16:31:20 -0700
committer	yum <yum.food.vr@gmail.com>	2022-10-25 16:31:20 -0700
commit	f84d83b611b751d20c9b7b983c4a90e389117a6b (patch)
tree	c2d1400f2ce688b336a6e39967a7853e15500eca /transcribe.py
parent	98284cc0ca42c75ef8cf22d9435821c62a12c592 (diff)