From e1730a63538d2b1a23c948d25580612303733eba Mon Sep 17 00:00:00 2001 From: yum Date: Wed, 23 Jul 2025 19:51:35 -0700 Subject: Update avg_logprob cutoff, fix sounds, fix electron build --- app/stt.py | 9 ++++++++- 1 file changed, 8 insertions(+), 1 deletion(-) (limited to 'app') diff --git a/app/stt.py b/app/stt.py index f36de97..b476ac0 100644 --- a/app/stt.py +++ b/app/stt.py @@ -523,6 +523,13 @@ class Whisper: f"no_speech_prob={s.no_speech_prob}, " + f"avg_logprob={s.avg_logprob})", file=sys.stderr) continue + if s.avg_logprob < -0.75: + if self.cfg["enable_debug_mode"]: + print(f"Drop probable hallucination (case 3) " + + f"(text='{s.text}', " + + f"no_speech_prob={s.no_speech_prob}, " + + f"avg_logprob={s.avg_logprob})", file=sys.stderr) + continue if self.cfg["enable_debug_mode"]: print(f"s get: {s}") if s.avg_logprob < -1.0: @@ -686,7 +693,7 @@ class VadCommitter: if self.cfg["save_audio"] and len(delta) > 0: ts = datetime.fromtimestamp(self.collector.now() - latency_s) - filename = str(ts.strftime('%Y_%m_%d__%H-%M-%S')) + ".wav" + filename = str(ts.strftime('%Y_%m_%d__%H-%M-%S')) + delta.strip() + ".wav" audio_dir = os.path.join(PROJECT_ROOT, "audio") if not os.path.exists(audio_dir): os.makedirs(audio_dir) -- cgit v1.2.3