From 15ad5bf7df3089c020a77e164539f268a0ef16b5 Mon Sep 17 00:00:00 2001 From: Icaro Bombonato Date: Tue, 31 Dec 2024 06:41:09 -0300 Subject: [PATCH] feat: update versions for pyannote:3.3.2 and faster-whisper:1.1.0 (#936) * chore: bump faster-whisper to 1.1.0 * chore: bump pyannote to 3.3.2 * feat: add multilingual option in load_model function --------- Co-authored-by: Barabazs <31799121+Barabazs@users.noreply.github.com> --- requirements.txt | 2 +- setup.py | 2 +- whisperx/asr.py | 1 + 3 files changed, 3 insertions(+), 2 deletions(-) diff --git a/requirements.txt b/requirements.txt index caaa730..8f1aabd 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,6 +1,6 @@ torch>=2 torchaudio>=2 -faster-whisper==1.0.3 +faster-whisper==1.1.0 ctranslate2==4.4.0 transformers pandas diff --git a/setup.py b/setup.py index 2b11e7e..fa05870 100644 --- a/setup.py +++ b/setup.py @@ -21,7 +21,7 @@ setup( open(os.path.join(os.path.dirname(__file__), "requirements.txt")) ) ] - + [f"pyannote.audio==3.1.1"], + + [f"pyannote.audio==3.3.2"], entry_points={ "console_scripts": ["whisperx=whisperx.transcribe:cli"], }, diff --git a/whisperx/asr.py b/whisperx/asr.py index 234034e..e403040 100644 --- a/whisperx/asr.py +++ b/whisperx/asr.py @@ -319,6 +319,7 @@ def load_model(whisper_arch, "word_timestamps": False, "prepend_punctuations": "\"'“¿([{-", "append_punctuations": "\"'.。,,!!??::”)]}、", + "multilingual": model.model.is_multilingual, "suppress_numerals": False, "max_new_tokens": None, "clip_timestamps": None,