Add a warning when the preset language differs from the language passed to transcribe

This commit is contained in:
briguetjo
2023-07-29 18:20:59 +02:00
parent d87f6268d0
commit 9d736dca1c

View File

@@ -258,7 +258,10 @@ class FasterWhisperPipeline(Pipeline):
vad_segments = self.vad_model({"waveform": torch.from_numpy(audio).unsqueeze(0), "sample_rate": SAMPLE_RATE})
vad_segments = merge_chunks(vad_segments, 30)
if self.preset_language is None:
if self.preset_language is None or self.preset_language != language:
if self.preset_language is not None and language is not None and self.preset_language != language:
print(f"Preset language '{self.preset_language}' is different from the language {language} passed to the transcribe method.")
print(f"Overriding preset language with {language}.")
language = language or self.detect_language(audio)
task = task or "transcribe"
self.tokenizer = faster_whisper.tokenizer.Tokenizer(self.model.hf_tokenizer,