diff options
Diffstat (limited to 'Scripts')
| -rw-r--r-- | Scripts/requirements.txt | 3 |
| -rw-r--r-- | Scripts/requirements_frozen.txt | 41 |
| -rw-r--r-- | Scripts/transcribe_v2.py | 8 |
3 files changed, 48 insertions, 4 deletions
diff --git a/Scripts/requirements.txt b/Scripts/requirements.txt index d694f4a..9224ba8 100644 --- a/Scripts/requirements.txt +++ b/Scripts/requirements.txt @@ -2,6 +2,7 @@ ctranslate2 editdistance faster-whisper@https://github.com/guillaumekln/faster-whisper/archive/78d57d73c5b4a76b32d1d5a415e4e7aea760295c.tar.gz future==0.18.2 +huggingface_hub==0.16.4 keyboard langcodes language-data @@ -14,5 +15,3 @@ pyyaml sentence_splitter transformers>=4.21.0 -git+https://github.com/openai/whisper.git -scipy diff --git a/Scripts/requirements_frozen.txt b/Scripts/requirements_frozen.txt new file mode 100644 index 0000000..dd56b9d --- /dev/null +++ b/Scripts/requirements_frozen.txt @@ -0,0 +1,41 @@ +av==10.0.0 +certifi==2023.7.22 +charset-normalizer==3.2.0 +colorama==0.4.6 +coloredlogs==15.0.1 +ctranslate2==3.19.0 +editdistance==0.6.2 +faster-whisper @ https://github.com/guillaumekln/faster-whisper/archive/78d57d73c5b4a76b32d1d5a415e4e7aea760295c.tar.gz#sha256=824b441278d59fb7daff99f98823d492762e279980922308a2e0833ac8e49c5c +filelock==3.12.3 +flatbuffers==23.5.26 +fsspec==2023.9.0 +future==0.18.2 +huggingface-hub==0.16.4 +humanfriendly==10.0 +idna==3.4 +keyboard==0.13.5 +langcodes==3.3.0 +language-data==1.1 +marisa-trie==0.7.8 +mpmath==1.3.0 +numpy==1.25.2 +onnxruntime==1.14.1 +openvr==1.26.701 +packaging==23.1 +Pillow==10.0.0 +protobuf==4.24.3 +PyAudio==0.2.13 +pydub==0.25.1 +pyreadline3==3.4.1 +python-osc==1.8.3 +PyYAML==6.0.1 +regex==2023.8.8 +requests==2.31.0 +safetensors==0.3.3 +sentence-splitter==1.4 +sympy==1.12 +tokenizers==0.13.3 +tqdm==4.66.1 +transformers==4.33.1 +typing_extensions==4.7.1 +urllib3==2.0.4 diff --git a/Scripts/transcribe_v2.py b/Scripts/transcribe_v2.py index 6377ff4..9eed78f 100644 --- a/Scripts/transcribe_v2.py +++ b/Scripts/transcribe_v2.py @@ -4,9 +4,7 @@ from faster_whisper import WhisperModel from functools import partial from profanity_filter import ProfanityFilter from pydub import AudioSegment -from scipy.optimize import minimize from 
sentence_splitter import split_text_into_sentences -from whisper.normalizers import EnglishTextNormalizer import app_config import argparse @@ -814,6 +812,12 @@ def evaluate(cfg, def optimize(cfg, experiments: typing.List[typing.Tuple[str, str]]): + install_in_venv(["git+https://github.com/openai/whisper.git", + "scipy"]) + + from scipy.optimize import minimize + from whisper.normalizers import EnglishTextNormalizer + def wrapper_to_optimize(x): s = 0 for audio_path, control_path in experiments: |
