diff options
| -rw-r--r-- | Scripts/requirements.txt | 2 | ||||
| -rw-r--r-- | Scripts/transcribe.py | 6 |
2 files changed, 4 insertions, 4 deletions
diff --git a/Scripts/requirements.txt b/Scripts/requirements.txt
index 647e942..80bf93d 100644
--- a/Scripts/requirements.txt
+++ b/Scripts/requirements.txt
@@ -1,6 +1,6 @@
 ctranslate2
 editdistance
-faster-whisper@https://github.com/guillaumekln/faster-whisper/archive/358d373691c95205021bd4bbf28cde7ce4d10030.tar.gz
+faster-whisper@https://github.com/guillaumekln/faster-whisper/archive/78d57d73c5b4a76b32d1d5a415e4e7aea760295c.tar.gz
 future==0.18.2
 keyboard
 langcodes
diff --git a/Scripts/transcribe.py b/Scripts/transcribe.py
index cebd70d..25ce22b 100644
--- a/Scripts/transcribe.py
+++ b/Scripts/transcribe.py
@@ -278,14 +278,14 @@ def transcribe(audio_state, model, frames, use_cpu: bool) -> typing.Tuple[str,st
 audio,
 beam_size = 5,
 language = audio_state.language,
- temperature = [0.0, 0.2, 0.4],
- log_prob_threshold = -1.0,
+ temperature = 0.0,
+ log_prob_threshold = -0.8,
 vad_filter = True,
 condition_on_previous_text = True,
 without_timestamps = False)
 ranges = []
 for s in segments:
- if s.avg_log_prob < -1.0 or s.no_speech_prob > 0.6:
+ if s.avg_logprob < -0.8 or s.no_speech_prob > 0.6:
 continue
 if audio_state.enable_debug_mode:
 print(f"Segment: {s}")
