diff options
| author | yum <yum.food.vr@gmail.com> | 2024-02-05 17:01:12 -0800 |
|---|---|---|
| committer | yum <yum.food.vr@gmail.com> | 2024-02-05 17:02:23 -0800 |
| commit | acccf8ebcff0f7cc2b26e45e497f8b12ab73d8e1 (patch) | |
| tree | 8c095c115b4b3447863a304d9a0f32f4e46e577f /Scripts/transcribe_v2.py | |
| parent | 33db3dcc23a45cae611bcf839c33d6615ccbf59e (diff) | |
Verify that audio is clean after VAD segmentation
Indeed it is. Bumped up the default max segment length to decrease
error.
Also add mic presets for beyond (the VR headset) and motu (my mic
interface).
Diffstat (limited to 'Scripts/transcribe_v2.py')
| -rw-r--r-- | Scripts/transcribe_v2.py | 9 |
1 files changed, 5 insertions, 4 deletions
diff --git a/Scripts/transcribe_v2.py b/Scripts/transcribe_v2.py index 491bc35..65a0cf8 100644 --- a/Scripts/transcribe_v2.py +++ b/Scripts/transcribe_v2.py @@ -337,7 +337,7 @@ class AudioSegmenter: # Returns the stable cutoff (if any) and whether there are any segments. def getStableCutoff(self, audio: bytes) -> typing.Tuple[int, bool]: min_delta_frames = int((self.vad_options.min_silence_duration_ms * - AudioStream.FPS) / 1000) + AudioStream.FPS) / 1000.0) cutoff = None last_end = None @@ -515,9 +515,10 @@ class VadCommitter: print(f"commit segment: {s}", file=sys.stderr) print(f"delta get: {delta}", file=sys.stderr) - #ts = datetime.fromtimestamp(self.collector.now() - latency_s) - #filename = str(ts.strftime('%Y_%m_%d__%H-%M-%S')) + ".wav" - #saveAudio(commit_audio, filename) + if True: + ts = datetime.fromtimestamp(self.collector.now() - latency_s) + filename = str(ts.strftime('%Y_%m_%d__%H-%M-%S')) + ".wav" + saveAudio(commit_audio, filename) preview = "" if self.cfg["enable_previews"] and has_audio: |
