mirror of
https://github.com/m-bain/whisperX.git
synced 2025-07-01 18:17:27 -04:00
add tokenizer is None case
This commit is contained in:
@ -228,7 +228,10 @@ class FasterWhisperPipeline(Pipeline):
|
|||||||
|
|
||||||
vad_segments = self.vad_model({"waveform": torch.from_numpy(audio).unsqueeze(0), "sample_rate": SAMPLE_RATE})
|
vad_segments = self.vad_model({"waveform": torch.from_numpy(audio).unsqueeze(0), "sample_rate": SAMPLE_RATE})
|
||||||
vad_segments = merge_chunks(vad_segments, 30)
|
vad_segments = merge_chunks(vad_segments, 30)
|
||||||
|
if self.tokenizer is None:
|
||||||
|
language = language or self.detect_language(audio)
|
||||||
|
task = task or "transcribe"
|
||||||
|
else:
|
||||||
language = language or self.tokenizer.language_code
|
language = language or self.tokenizer.language_code
|
||||||
task = task or self.tokenizer.task
|
task = task or self.tokenizer.task
|
||||||
if task != self.tokenizer.task or language != self.tokenizer.language_code:
|
if task != self.tokenizer.task or language != self.tokenizer.language_code:
|
||||||
|
Reference in New Issue
Block a user