summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
-rw-r--r--Fonts/Bitmaps/font-ascii.pngbin543838 -> 962256 bytes
-rw-r--r--GUI/GUI/GUI/Config.cpp2
-rw-r--r--GUI/GUI/GUI/Frame.cpp2
-rw-r--r--Scripts/generate_fonts.py6
-rw-r--r--Scripts/transcribe_v2.py9
5 files changed, 11 insertions, 8 deletions
diff --git a/Fonts/Bitmaps/font-ascii.png b/Fonts/Bitmaps/font-ascii.png
index 1a8ba99..098d651 100644
--- a/Fonts/Bitmaps/font-ascii.png
+++ b/Fonts/Bitmaps/font-ascii.png
Binary files differ
diff --git a/GUI/GUI/GUI/Config.cpp b/GUI/GUI/GUI/Config.cpp
index 2abe5b2..a92502d 100644
--- a/GUI/GUI/GUI/Config.cpp
+++ b/GUI/GUI/GUI/Config.cpp
@@ -87,7 +87,7 @@ AppConfig::AppConfig(wxTextCtrl* out)
enable_lock_at_spawn(true),
gpu_idx(0),
min_silence_duration_ms(250),
- max_speech_duration_s(5),
+ max_speech_duration_s(15),
reset_after_silence_s(10),
transcription_loop_delay_ms(100),
keybind("ctrl+x"),
diff --git a/GUI/GUI/GUI/Frame.cpp b/GUI/GUI/GUI/Frame.cpp
index 0c83742..8e4eb6d 100644
--- a/GUI/GUI/GUI/Frame.cpp
+++ b/GUI/GUI/GUI/Frame.cpp
@@ -119,7 +119,9 @@ namespace {
const wxString kMicChoices[] = {
"index",
+ "beyond",
"focusrite",
+ "motu",
// ok now this is epic
"0",
"1",
diff --git a/Scripts/generate_fonts.py b/Scripts/generate_fonts.py
index cf73e6a..8dc8a89 100644
--- a/Scripts/generate_fonts.py
+++ b/Scripts/generate_fonts.py
@@ -155,7 +155,7 @@ def genUnicode():
def genASCII():
# Create an 8k grayscale image. 16 glyphs wide, 8 glyphs tall.
# Only characters on the range [0, 128).
- image = Image.new(mode="L", size=(8192,8192), color=0)
+ image = Image.new(mode="RGBA", size=(8192,8192), color=0)
draw = ImageDraw.Draw(image)
n_rows = 8
n_cols = 16
@@ -174,11 +174,11 @@ def genASCII():
else:
char = " "
draw.text((col * font_pixels * 8 / 2, row * font_pixels * 8 - 20),
- char, font=font, fill=255)
+ char, font=font, fill=(255,255,255))
image.save("Fonts/Bitmaps/font-ascii.png")
if __name__ == "__main__":
print("Generating unicode fonts")
- genUnicode()
+ #genUnicode()
print("Generating ASCII fonts")
genASCII()
diff --git a/Scripts/transcribe_v2.py b/Scripts/transcribe_v2.py
index 491bc35..65a0cf8 100644
--- a/Scripts/transcribe_v2.py
+++ b/Scripts/transcribe_v2.py
@@ -337,7 +337,7 @@ class AudioSegmenter:
# Returns the stable cutoff (if any) and whether there are any segments.
def getStableCutoff(self, audio: bytes) -> typing.Tuple[int, bool]:
min_delta_frames = int((self.vad_options.min_silence_duration_ms *
- AudioStream.FPS) / 1000)
+ AudioStream.FPS) / 1000.0)
cutoff = None
last_end = None
@@ -515,9 +515,10 @@ class VadCommitter:
print(f"commit segment: {s}", file=sys.stderr)
print(f"delta get: {delta}", file=sys.stderr)
- #ts = datetime.fromtimestamp(self.collector.now() - latency_s)
- #filename = str(ts.strftime('%Y_%m_%d__%H-%M-%S')) + ".wav"
- #saveAudio(commit_audio, filename)
+ if True:
+ ts = datetime.fromtimestamp(self.collector.now() - latency_s)
+ filename = str(ts.strftime('%Y_%m_%d__%H-%M-%S')) + ".wav"
+ saveAudio(commit_audio, filename)
preview = ""
if self.cfg["enable_previews"] and has_audio: