diff options
| author | yum <yum.food.vr@gmail.com> | 2023-02-19 11:46:43 -0800 |
|---|---|---|
| committer | yum <yum.food.vr@gmail.com> | 2023-02-19 12:10:13 -0800 |
| commit | 52f743e43a9ef582e04d7a363fbda19824db6cc7 (patch) | |
| tree | c3493a0feb31f4d0bcf07b31a8f1c6bdf1dfd38b | |
| parent | bd72a8e97e120604405f2330664e9658e44e3de1 (diff) | |
Remove exponential backoff cap (v0.7.0)
Allows sustained exponential backoff when not transcribing. The backoff
previously capped out at 1s.
* Add more items to README TODO list
* Adjust emote metadata
* Emotes bugfix: A nonexistent emote map no longer causes the transcription
engine to bail out.
| -rw-r--r-- | Fonts/Bitmaps/emotes.png.meta | 20 | ||||
| -rw-r--r-- | README.md | 6 | ||||
| -rw-r--r-- | Scripts/emotes_v2.py | 8 | ||||
| -rw-r--r-- | Scripts/transcribe.py | 3 |
4 files changed, 23 insertions, 14 deletions
diff --git a/Fonts/Bitmaps/emotes.png.meta b/Fonts/Bitmaps/emotes.png.meta index c2bc609..1e794cb 100644 --- a/Fonts/Bitmaps/emotes.png.meta +++ b/Fonts/Bitmaps/emotes.png.meta @@ -39,7 +39,7 @@ TextureImporter: wrapW: 1 nPOTScale: 1 lightmap: 0 - compressionQuality: 50 + compressionQuality: 100 spriteMode: 0 spriteExtrude: 1 spriteMeshType: 1 @@ -61,11 +61,11 @@ TextureImporter: platformSettings: - serializedVersion: 3 buildTarget: DefaultTexturePlatform - maxTextureSize: 4096 - resizeAlgorithm: 0 + maxTextureSize: 2048 + resizeAlgorithm: 1 textureFormat: -1 textureCompression: 2 - compressionQuality: 50 + compressionQuality: 100 crunchedCompression: 0 allowsAlphaSplitting: 0 overridden: 0 @@ -73,11 +73,11 @@ TextureImporter: forceMaximumCompressionQuality_BC6H_BC7: 0 - serializedVersion: 3 buildTarget: Standalone - maxTextureSize: 4096 - resizeAlgorithm: 0 + maxTextureSize: 2048 + resizeAlgorithm: 1 textureFormat: -1 textureCompression: 2 - compressionQuality: 50 + compressionQuality: 100 crunchedCompression: 0 allowsAlphaSplitting: 0 overridden: 0 @@ -85,11 +85,11 @@ TextureImporter: forceMaximumCompressionQuality_BC6H_BC7: 0 - serializedVersion: 3 buildTarget: Android - maxTextureSize: 4096 - resizeAlgorithm: 0 + maxTextureSize: 2048 + resizeAlgorithm: 1 textureFormat: -1 textureCompression: 2 - compressionQuality: 50 + compressionQuality: 100 crunchedCompression: 0 allowsAlphaSplitting: 0 overridden: 0 @@ -200,6 +200,12 @@ Ping the discord if you need help getting set up. 8. ~~Customizable controller bindings. Someone mentioned they use left click to unmute. Let's work around users, not make them change their existing keybinds.~~ DONE + 9. One-click upgrade. Fetch latest stable release, copy over virtual env and + UI configs, relaunch. + 10. Browser source for OBS. Blocker: the transcription layer doesn't handle + long pauses well. + 11. Test suite. Some long representative transcripts with mechanical word + error rate (WER) calculation. 4. Optimization 1. 
~~Utilize the avatar 3.0 SDK's ability to drive parameters to reduce the total # of parameters (and therefore OSC messages & sync events). Note diff --git a/Scripts/emotes_v2.py b/Scripts/emotes_v2.py index 165db7c..aaf8d18 100644 --- a/Scripts/emotes_v2.py +++ b/Scripts/emotes_v2.py @@ -68,8 +68,12 @@ class EmotesState: self.bits = {} def load(self, pickle_path): - with open(pickle_path, 'rb') as f: - self.bits = pickle.load(f) + try: + with open(pickle_path, 'rb') as f: + self.bits = pickle.load(f) + except FileNotFoundError: + print(f"Emotes map does not exist at {pickle_path}", + file=sys.stderr) # This is quite slow since we do a search and replace (O(n)) # for each keyword O(m) times each variant of said keyword (O(k)). diff --git a/Scripts/transcribe.py b/Scripts/transcribe.py index d67edb6..c4d7682 100644 --- a/Scripts/transcribe.py +++ b/Scripts/transcribe.py @@ -252,10 +252,9 @@ def transcribeAudio(audio_state, model, use_cpu: bool): else: time.sleep(0.05) + audio_state.transcribe_no_change_count += 1 # Increase sleep time. Code below will set sleep time back to minimum # if a change is detected. - if audio_state.transcribe_no_change_count < 10: - audio_state.transcribe_no_change_count += 1 longer_sleep_dur = audio_state.transcribe_sleep_duration longer_sleep_dur += audio_state.transcribe_sleep_duration_min_s * (1.3**audio_state.transcribe_no_change_count) if audio_state.audio_paused: |
