diff options
| author | yum <yum.food.vr@gmail.com> | 2023-07-07 02:30:18 -0700 |
|---|---|---|
| committer | yum <yum.food.vr@gmail.com> | 2023-07-07 02:35:51 -0700 |
| commit | 7a576bcac1c37c3c5a59fadf172aa70b15ff83c8 (patch) | |
| tree | e7fa6e499e3bc12ddf4096aad30f2705f34ce556 /Scripts/transcribe.py | |
| parent | 2793ac9dd31059f2fc29f7978bcb688a7de664ed (diff) | |
Enforce a stricter avg_logprob than default (tag: v0.13.1)
Common hallucinations sneak in around -0.9 avg_logprob.
Also:
* Limit temperatures to just 0.0. Multiple values cause latency to
occasionally spike.
Diffstat (limited to 'Scripts/transcribe.py')
| -rw-r--r-- | Scripts/transcribe.py | 6 |
1 file changed, 3 insertions, 3 deletions
diff --git a/Scripts/transcribe.py b/Scripts/transcribe.py index cebd70d..25ce22b 100644 --- a/Scripts/transcribe.py +++ b/Scripts/transcribe.py @@ -278,14 +278,14 @@ def transcribe(audio_state, model, frames, use_cpu: bool) -> typing.Tuple[str,st audio, beam_size = 5, language = audio_state.language, - temperature = [0.0, 0.2, 0.4], - log_prob_threshold = -1.0, + temperature = 0.0, + log_prob_threshold = -0.8, vad_filter = True, condition_on_previous_text = True, without_timestamps = False) ranges = [] for s in segments: - if s.avg_log_prob < -1.0 or s.no_speech_prob > 0.6: + if s.avg_logprob < -0.8 or s.no_speech_prob > 0.6: continue if audio_state.enable_debug_mode: print(f"Segment: {s}") |
