From f97cef182de55b6dbae8d2bc0477acfca6cc1f66 Mon Sep 17 00:00:00 2001
From: yum
Date: Thu, 29 May 2025 19:45:48 -0700
Subject: More UI work

1. main STT app works in new project structure
2. UI dumps mics on startup to populate mic list
3. add missing deps (hf-xet, wave)
4. normalize audio volume when transcribing. Probably still wrong tbqh.
5. add checkbox to save audio segments & improve logic so only segments
   with speech get saved.
6. add default config settings
---
 config.yaml | 7 +++----
 1 file changed, 3 insertions(+), 4 deletions(-)

(limited to 'config.yaml')

diff --git a/config.yaml b/config.yaml
index 164b4e6..34d88f1 100644
--- a/config.yaml
+++ b/config.yaml
@@ -1,18 +1,17 @@
-compute_type: int8
+compute_type: float16
 enable_debug_mode: 0
 enable_previews: 1
+save_audio: 0
 language: english
 gpu_idx: 0
 max_speech_duration_s: 10
 min_silence_duration_ms: 250
-microphone: motu
+microphone: 0
 model: turbo
 reset_after_silence_s: 15
 transcription_loop_delay_ms: 100
 use_cpu: 0
-
 block_width: 2
 num_blocks: 40
 rows: 10
 cols: 24
-
-- 
cgit v1.2.3