From 7a576bcac1c37c3c5a59fadf172aa70b15ff83c8 Mon Sep 17 00:00:00 2001 From: yum Date: Fri, 7 Jul 2023 02:30:18 -0700 Subject: Enforce a stricter avg_logprob than default Common hallucinations sneak in around -0.9 avg_logprob. Also: * Limit temperatures to just 0.0. Multiple values cause latency to occasionally spike. --- Scripts/transcribe.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) (limited to 'Scripts/transcribe.py') diff --git a/Scripts/transcribe.py b/Scripts/transcribe.py index cebd70d..25ce22b 100644 --- a/Scripts/transcribe.py +++ b/Scripts/transcribe.py @@ -278,14 +278,14 @@ def transcribe(audio_state, model, frames, use_cpu: bool) -> typing.Tuple[str,st audio, beam_size = 5, language = audio_state.language, - temperature = [0.0, 0.2, 0.4], - log_prob_threshold = -1.0, + temperature = 0.0, + log_prob_threshold = -0.8, vad_filter = True, condition_on_previous_text = True, without_timestamps = False) ranges = [] for s in segments: - if s.avg_log_prob < -1.0 or s.no_speech_prob > 0.6: + if s.avg_logprob < -0.8 or s.no_speech_prob > 0.6: continue if audio_state.enable_debug_mode: print(f"Segment: {s}") -- cgit v1.2.3