summary | refs | log | tree | commit | diff | stats
path: root/Whisper/API
diff options
context:
space:
mode:
author yum <yum.food.vr@gmail.com> 2023-02-26 19:42:33 -0800
committer yum <yum.food.vr@gmail.com> 2023-02-26 20:09:15 -0800
commit 1136acfc365f357d2df13a263714e8ae0614c4f9 (patch)
tree 6109149806673ade4505d956b09d1996034f7cab /Whisper/API
parent 02c2605454288f7c86023ae700366acf08cd2206 (diff)
Add retainDuration option to CaptureParams
This allows users to retain a suffix of the PCM buffer after a VAD segmentation event, reducing some instances of words being lost at the start of the next VAD window.
Diffstat (limited to 'Whisper/API')
-rw-r--r-- Whisper/API/MfStructs.h 3
1 file changed, 3 insertions, 0 deletions
diff --git a/Whisper/API/MfStructs.h b/Whisper/API/MfStructs.h
index 39255de..c23d633 100644
--- a/Whisper/API/MfStructs.h
+++ b/Whisper/API/MfStructs.h
@@ -28,6 +28,9 @@ namespace Whisper
float maxDuration = 3.0f;
float dropStartSilence = 0.25f;
float pauseDuration = 0.333f;
+ // After audio is segmented using VAD, as many as this many seconds of
+ // audio will be retained as the input to the next transcription window.
+ float retainDuration = 0.25f;
// Flags for the audio capture
uint32_t flags = 0;
};