From 912920c591085b3ae361b842365a4563de410fc9 Mon Sep 17 00:00:00 2001 From: Jan Panoch Date: Wed, 7 Aug 2024 10:05:17 +0200 Subject: [PATCH 1/5] Update alignment.py - added alignment for sk and sl languages --- whisperx/alignment.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/whisperx/alignment.py b/whisperx/alignment.py index 8294983..e030610 100644 --- a/whisperx/alignment.py +++ b/whisperx/alignment.py @@ -55,6 +55,8 @@ DEFAULT_ALIGN_MODELS_HF = { "ml": "gvs/wav2vec2-large-xlsr-malayalam", "no": "NbAiLab/nb-wav2vec2-1b-bokmaal", "nn": "NbAiLab/nb-wav2vec2-300m-nynorsk", + "sk": "comodoro/wav2vec2-xls-r-300m-sk-cv8", + "sl": "anton-l/wav2vec2-large-xlsr-53-slovenian", } From 6f70aa6bebefdfde9334da3856df2a58c6a14d45 Mon Sep 17 00:00:00 2001 From: Jan Panoch Date: Thu, 8 Aug 2024 08:10:55 +0200 Subject: [PATCH 2/5] Update alignment.py - added croatian (hr) language --- whisperx/alignment.py | 1 + 1 file changed, 1 insertion(+) diff --git a/whisperx/alignment.py b/whisperx/alignment.py index e030610..4d81c0d 100644 --- a/whisperx/alignment.py +++ b/whisperx/alignment.py @@ -57,6 +57,7 @@ DEFAULT_ALIGN_MODELS_HF = { "nn": "NbAiLab/nb-wav2vec2-300m-nynorsk", "sk": "comodoro/wav2vec2-xls-r-300m-sk-cv8", "sl": "anton-l/wav2vec2-large-xlsr-53-slovenian", + "hr": "classla/wav2vec2-large-slavic-parlaspeech-hr-lm", } From 59b4d88d1dd2c828c22967cad2bbbf88090adbef Mon Sep 17 00:00:00 2001 From: Jan Panoch Date: Thu, 8 Aug 2024 08:29:11 +0200 Subject: [PATCH 3/5] Update alignment.py - trying another hr alignment file --- whisperx/alignment.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/whisperx/alignment.py b/whisperx/alignment.py index 4d81c0d..5507d59 100644 --- a/whisperx/alignment.py +++ b/whisperx/alignment.py @@ -57,7 +57,8 @@ DEFAULT_ALIGN_MODELS_HF = { "nn": "NbAiLab/nb-wav2vec2-300m-nynorsk", "sk": "comodoro/wav2vec2-xls-r-300m-sk-cv8", "sl": "anton-l/wav2vec2-large-xlsr-53-slovenian", - "hr": "classla/wav2vec2-large-slavic-parlaspeech-hr-lm", +# "hr": "classla/wav2vec2-large-slavic-parlaspeech-hr-lm", + "hr": "facebook/wav2vec2-base-hr-voxpopuli-v2", } From 9a9b6171e6393c4bc6f287c85ab1aaa83deb4ff0 Mon Sep 17 00:00:00 2001 From: Jan Panoch Date: Thu, 8 Aug 2024 08:37:55 +0200 Subject: [PATCH 4/5] Update alignment.py - trying another hr alignment --- whisperx/alignment.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/whisperx/alignment.py b/whisperx/alignment.py index 5507d59..829c721 100644 --- a/whisperx/alignment.py +++ b/whisperx/alignment.py @@ -58,7 +58,8 @@ DEFAULT_ALIGN_MODELS_HF = { "sk": "comodoro/wav2vec2-xls-r-300m-sk-cv8", "sl": "anton-l/wav2vec2-large-xlsr-53-slovenian", # "hr": "classla/wav2vec2-large-slavic-parlaspeech-hr-lm", - "hr": "facebook/wav2vec2-base-hr-voxpopuli-v2", + "hr": "classla/wav2vec2-xls-r-parlaspeech-hr", +# "hr": "facebook/wav2vec2-base-hr-voxpopuli-v2", } From 3f339f95159a2032e84651f8915135015bec7dd4 Mon Sep 17 00:00:00 2001 From: Jan Panoch Date: Fri, 9 Aug 2024 13:00:12 +0200 Subject: [PATCH 5/5] Update alignment.py - remove commented-out alignment modules for hr language --- whisperx/alignment.py | 2 -- 1 file changed, 2 deletions(-) diff --git a/whisperx/alignment.py b/whisperx/alignment.py index 829c721..964217e 100644 --- a/whisperx/alignment.py +++ b/whisperx/alignment.py @@ -57,9 +57,7 @@ DEFAULT_ALIGN_MODELS_HF = { "nn": "NbAiLab/nb-wav2vec2-300m-nynorsk", "sk": "comodoro/wav2vec2-xls-r-300m-sk-cv8", "sl": "anton-l/wav2vec2-large-xlsr-53-slovenian", -# "hr": "classla/wav2vec2-large-slavic-parlaspeech-hr-lm", "hr": "classla/wav2vec2-xls-r-parlaspeech-hr", -# "hr": "facebook/wav2vec2-base-hr-voxpopuli-v2", }