From 113f2858016c252b97cac96eab454ee16b2dcda2 Mon Sep 17 00:00:00 2001 From: yum Date: Thu, 27 Oct 2022 19:15:48 -0700 Subject: Tweak continuous transcription Stitching now uses a 6-word sliding window instead of a 4-word one. Seems to dramatically improve transcription quality. --- string_matcher.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) (limited to 'string_matcher.py') diff --git a/string_matcher.py b/string_matcher.py index 458244b..17bfaac 100644 --- a/string_matcher.py +++ b/string_matcher.py @@ -8,7 +8,7 @@ import typing # Find the window where the distance between these two transcriptions is # minimized and use it to stitch them together. def matchStringList(old_words: typing.List[str], - new_words: typing.List[str], window_size = 4) -> str: + new_words: typing.List[str], window_size = 6) -> str: if old_words == new_words: return " ".join(old_words) elif len(old_words) >= window_size and len(new_words) >= window_size: -- cgit v1.2.3