From a49799294bd13113edb508e51f0df9b0b24379dd Mon Sep 17 00:00:00 2001 From: Mahmoud Ashraf <32404268+MahmoudAshraf97@users.noreply.github.com> Date: Tue, 31 Jan 2023 19:07:48 +0200 Subject: [PATCH 1/3] add Arabic wav2vec2 model from elgeish --- whisperx/alignment.py | 1 + 1 file changed, 1 insertion(+) diff --git a/whisperx/alignment.py b/whisperx/alignment.py index e4950f9..5549d8b 100644 --- a/whisperx/alignment.py +++ b/whisperx/alignment.py @@ -29,6 +29,7 @@ DEFAULT_ALIGN_MODELS_HF = { "nl": "jonatasgrosman/wav2vec2-large-xlsr-53-dutch", "uk": "Yehor/wav2vec2-xls-r-300m-uk-with-small-lm", "pt": "jonatasgrosman/wav2vec2-large-xlsr-53-portuguese", + "ar": "elgeish/wav2vec2-large-xlsr-53-arabic", } From 1b08661e42acb8a9210cabdcdc3afa3889f7aa9a Mon Sep 17 00:00:00 2001 From: Mahmoud Ashraf <32404268+MahmoudAshraf97@users.noreply.github.com> Date: Tue, 31 Jan 2023 19:32:31 +0200 Subject: [PATCH 2/3] change Arabic model to jonatasgrosman --- whisperx/alignment.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/whisperx/alignment.py b/whisperx/alignment.py index 5549d8b..ea97d8c 100644 --- a/whisperx/alignment.py +++ b/whisperx/alignment.py @@ -29,7 +29,7 @@ DEFAULT_ALIGN_MODELS_HF = { "nl": "jonatasgrosman/wav2vec2-large-xlsr-53-dutch", "uk": "Yehor/wav2vec2-xls-r-300m-uk-with-small-lm", "pt": "jonatasgrosman/wav2vec2-large-xlsr-53-portuguese", - "ar": "elgeish/wav2vec2-large-xlsr-53-arabic", + "ar": "jonatasgrosman/wav2vec2-large-xlsr-53-arabic", } From 0eae9e1f50d174e6f6f14c1ecfb92807ec1dc16c Mon Sep 17 00:00:00 2001 From: Mahmoud Ashraf <32404268+MahmoudAshraf97@users.noreply.github.com> Date: Wed, 1 Feb 2023 03:02:10 +0200 Subject: [PATCH 3/3] added several wav2vec2 models by jonatasgrosman; since his models were already used for other languages and I tested the Arabic model myself, I assumed it's safe to include all the available models --- whisperx/alignment.py | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/whisperx/alignment.py 
b/whisperx/alignment.py index ea97d8c..fd92d9e 100644 --- a/whisperx/alignment.py +++ b/whisperx/alignment.py @@ -30,6 +30,12 @@ DEFAULT_ALIGN_MODELS_HF = { "uk": "Yehor/wav2vec2-xls-r-300m-uk-with-small-lm", "pt": "jonatasgrosman/wav2vec2-large-xlsr-53-portuguese", "ar": "jonatasgrosman/wav2vec2-large-xlsr-53-arabic", + "ru": "jonatasgrosman/wav2vec2-large-xlsr-53-russian", + "pl": "jonatasgrosman/wav2vec2-large-xlsr-53-polish", + "hu": "jonatasgrosman/wav2vec2-large-xlsr-53-hungarian", + "fi": "jonatasgrosman/wav2vec2-large-xlsr-53-finnish", + "fa": "jonatasgrosman/wav2vec2-large-xlsr-53-persian", + "el": "jonatasgrosman/wav2vec2-large-xlsr-53-greek", }