summary | refs | log | tree | commit | diff | stats
diff options
context:
space:
mode:
author: yum <yum.food.vr@gmail.com> 2023-02-19 11:46:43 -0800
committer: yum <yum.food.vr@gmail.com> 2023-02-19 12:10:13 -0800
commit: 52f743e43a9ef582e04d7a363fbda19824db6cc7 (patch)
tree: c3493a0feb31f4d0bcf07b31a8f1c6bdf1dfd38b
parent: bd72a8e97e120604405f2330664e9658e44e3de1 (diff)
Remove exponential backoff cap (v0.7.0)

Allows sustained exponential backoff when not transcribing. The backoff used to cap out at 1s.

* Add more items to README TODO list
* Adjust emote metadata
* Emotes bugfix: A non-existent emote map no longer causes the transcription engine to bail out.
-rw-r--r-- Fonts/Bitmaps/emotes.png.meta 20
-rw-r--r-- README.md 6
-rw-r--r-- Scripts/emotes_v2.py 8
-rw-r--r-- Scripts/transcribe.py 3
4 files changed, 23 insertions, 14 deletions
diff --git a/Fonts/Bitmaps/emotes.png.meta b/Fonts/Bitmaps/emotes.png.meta
index c2bc609..1e794cb 100644
--- a/Fonts/Bitmaps/emotes.png.meta
+++ b/Fonts/Bitmaps/emotes.png.meta
@@ -39,7 +39,7 @@ TextureImporter:
wrapW: 1
nPOTScale: 1
lightmap: 0
- compressionQuality: 50
+ compressionQuality: 100
spriteMode: 0
spriteExtrude: 1
spriteMeshType: 1
@@ -61,11 +61,11 @@ TextureImporter:
platformSettings:
- serializedVersion: 3
buildTarget: DefaultTexturePlatform
- maxTextureSize: 4096
- resizeAlgorithm: 0
+ maxTextureSize: 2048
+ resizeAlgorithm: 1
textureFormat: -1
textureCompression: 2
- compressionQuality: 50
+ compressionQuality: 100
crunchedCompression: 0
allowsAlphaSplitting: 0
overridden: 0
@@ -73,11 +73,11 @@ TextureImporter:
forceMaximumCompressionQuality_BC6H_BC7: 0
- serializedVersion: 3
buildTarget: Standalone
- maxTextureSize: 4096
- resizeAlgorithm: 0
+ maxTextureSize: 2048
+ resizeAlgorithm: 1
textureFormat: -1
textureCompression: 2
- compressionQuality: 50
+ compressionQuality: 100
crunchedCompression: 0
allowsAlphaSplitting: 0
overridden: 0
@@ -85,11 +85,11 @@ TextureImporter:
forceMaximumCompressionQuality_BC6H_BC7: 0
- serializedVersion: 3
buildTarget: Android
- maxTextureSize: 4096
- resizeAlgorithm: 0
+ maxTextureSize: 2048
+ resizeAlgorithm: 1
textureFormat: -1
textureCompression: 2
- compressionQuality: 50
+ compressionQuality: 100
crunchedCompression: 0
allowsAlphaSplitting: 0
overridden: 0
diff --git a/README.md b/README.md
index 322effe..ff4781e 100644
--- a/README.md
+++ b/README.md
@@ -200,6 +200,12 @@ Ping the discord if you need help getting set up.
8. ~~Customizable controller bindings. Someone mentioned they use left click
to unmute. Let's work around users, not make them change their existing
keybinds.~~ DONE
+ 9. One-click upgrade. Fetch latest stable release, copy over virtual env and
+ UI configs, relaunch.
+ 10. Browser source for OBS. Blocker: the transcription layer doesn't handle
+ long pauses well.
+ 11. Test suite. Some long representative transcripts with mechanical word
+ error rate (WER) calculation.
4. Optimization
1. ~~Utilize the avatar 3.0 SDK's ability to drive parameters to reduce the
total # of parameters (and therefore OSC messages & sync events). Note
diff --git a/Scripts/emotes_v2.py b/Scripts/emotes_v2.py
index 165db7c..aaf8d18 100644
--- a/Scripts/emotes_v2.py
+++ b/Scripts/emotes_v2.py
@@ -68,8 +68,12 @@ class EmotesState:
self.bits = {}
def load(self, pickle_path):
- with open(pickle_path, 'rb') as f:
- self.bits = pickle.load(f)
+ try:
+ with open(pickle_path, 'rb') as f:
+ self.bits = pickle.load(f)
+ except FileNotFoundError:
+ print(f"Emotes map does not exist at {pickle_path}",
+ file=sys.stderr)
# This is quite slow since we do a search and replace (O(n))
# for each keyword O(m) times each variant of said keyword (O(k)).
diff --git a/Scripts/transcribe.py b/Scripts/transcribe.py
index d67edb6..c4d7682 100644
--- a/Scripts/transcribe.py
+++ b/Scripts/transcribe.py
@@ -252,10 +252,9 @@ def transcribeAudio(audio_state, model, use_cpu: bool):
else:
time.sleep(0.05)
+ audio_state.transcribe_no_change_count += 1
# Increase sleep time. Code below will set sleep time back to minimum
# if a change is detected.
- if audio_state.transcribe_no_change_count < 10:
- audio_state.transcribe_no_change_count += 1
longer_sleep_dur = audio_state.transcribe_sleep_duration
longer_sleep_dur += audio_state.transcribe_sleep_duration_min_s * (1.3**audio_state.transcribe_no_change_count)
if audio_state.audio_paused: