From da6ed83dc98c18256dcd27942d8d211f810c53c0 Mon Sep 17 00:00:00 2001 From: Dudu Asulin <46293514+davidas1@users.noreply.github.com> Date: Wed, 2 Aug 2023 10:34:42 +0300 Subject: [PATCH] more --- whisperx/diarize.py | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/whisperx/diarize.py b/whisperx/diarize.py index 2a9bd69..eae6a19 100644 --- a/whisperx/diarize.py +++ b/whisperx/diarize.py @@ -4,7 +4,7 @@ from pyannote.audio import Pipeline from typing import Optional, Union import torch -from .audio import SAMPLE_RATE +from .audio import load_audio, SAMPLE_RATE class DiarizationPipeline: def __init__( @@ -18,6 +18,8 @@ class DiarizationPipeline: self.model = Pipeline.from_pretrained(model_name, use_auth_token=use_auth_token).to(device) def __call__(self, audio, min_speakers=None, max_speakers=None): + if isinstance(audio, str): + audio = load_audio(audio) audio_data = { 'waveform': torch.from_numpy(audio[None, :]), 'sample_rate': SAMPLE_RATE