summaryrefslogtreecommitdiffstats
diff options
context:
space:
mode:
-rw-r--r--GUI/GUI/GUI/Frame.cpp2
-rw-r--r--Scripts/requirements.txt3
-rw-r--r--Scripts/requirements_frozen.txt41
-rw-r--r--Scripts/transcribe_v2.py8
4 files changed, 49 insertions, 5 deletions
diff --git a/GUI/GUI/GUI/Frame.cpp b/GUI/GUI/GUI/Frame.cpp
index 273423e..0d30809 100644
--- a/GUI/GUI/GUI/Frame.cpp
+++ b/GUI/GUI/GUI/Frame.cpp
@@ -1789,7 +1789,7 @@ void Frame::EnsureVirtualEnv(bool block, bool force)
"-u", // Unbuffered output
"-m pip",
"install",
- "-r Resources/Scripts/requirements.txt",
+ "-r Resources/Scripts/requirements_frozen.txt",
}, std::move(out_cb))) {
Log(transcribe_out_, "Failed to launch environment setup thread!\n");
return false;
diff --git a/Scripts/requirements.txt b/Scripts/requirements.txt
index d694f4a..9224ba8 100644
--- a/Scripts/requirements.txt
+++ b/Scripts/requirements.txt
@@ -2,6 +2,7 @@ ctranslate2
editdistance
faster-whisper@https://github.com/guillaumekln/faster-whisper/archive/78d57d73c5b4a76b32d1d5a415e4e7aea760295c.tar.gz
future==0.18.2
+huggingface_hub==0.16.4
keyboard
langcodes
language-data
@@ -14,5 +15,3 @@ pyyaml
sentence_splitter
transformers>=4.21.0
-git+https://github.com/openai/whisper.git
-scipy
diff --git a/Scripts/requirements_frozen.txt b/Scripts/requirements_frozen.txt
new file mode 100644
index 0000000..dd56b9d
--- /dev/null
+++ b/Scripts/requirements_frozen.txt
@@ -0,0 +1,41 @@
+av==10.0.0
+certifi==2023.7.22
+charset-normalizer==3.2.0
+colorama==0.4.6
+coloredlogs==15.0.1
+ctranslate2==3.19.0
+editdistance==0.6.2
+faster-whisper @ https://github.com/guillaumekln/faster-whisper/archive/78d57d73c5b4a76b32d1d5a415e4e7aea760295c.tar.gz#sha256=824b441278d59fb7daff99f98823d492762e279980922308a2e0833ac8e49c5c
+filelock==3.12.3
+flatbuffers==23.5.26
+fsspec==2023.9.0
+future==0.18.2
+huggingface-hub==0.16.4
+humanfriendly==10.0
+idna==3.4
+keyboard==0.13.5
+langcodes==3.3.0
+language-data==1.1
+marisa-trie==0.7.8
+mpmath==1.3.0
+numpy==1.25.2
+onnxruntime==1.14.1
+openvr==1.26.701
+packaging==23.1
+Pillow==10.0.0
+protobuf==4.24.3
+PyAudio==0.2.13
+pydub==0.25.1
+pyreadline3==3.4.1
+python-osc==1.8.3
+PyYAML==6.0.1
+regex==2023.8.8
+requests==2.31.0
+safetensors==0.3.3
+sentence-splitter==1.4
+sympy==1.12
+tokenizers==0.13.3
+tqdm==4.66.1
+transformers==4.33.1
+typing_extensions==4.7.1
+urllib3==2.0.4
diff --git a/Scripts/transcribe_v2.py b/Scripts/transcribe_v2.py
index 6377ff4..9eed78f 100644
--- a/Scripts/transcribe_v2.py
+++ b/Scripts/transcribe_v2.py
@@ -4,9 +4,7 @@ from faster_whisper import WhisperModel
from functools import partial
from profanity_filter import ProfanityFilter
from pydub import AudioSegment
-from scipy.optimize import minimize
from sentence_splitter import split_text_into_sentences
-from whisper.normalizers import EnglishTextNormalizer
import app_config
import argparse
@@ -814,6 +812,12 @@ def evaluate(cfg,
def optimize(cfg,
experiments: typing.List[typing.Tuple[str, str]]):
+ install_in_venv(["git+https://github.com/openai/whisper.git",
+ "scipy"])
+
+ from scipy.optimize import minimize
+ from whisper.normalizers import EnglishTextNormalizer
+
def wrapper_to_optimize(x):
s = 0
for audio_path, control_path in experiments: