Add VAD (voice activity detection) filter

This commit is contained in:
Max Bain
2023-01-20 12:54:20 +00:00
parent 78c87d3bfd
commit ba102feb7f
3 changed files with 185 additions and 12 deletions

View File

@ -116,14 +116,14 @@ audio_file = "audio.mp3"
model = whisperx.load_model("large", device)
result = model.transcribe(audio_file)
print(result["segments"]) # before alignment
# load alignment model and metadata
model_a, metadata = whisperx.load_align_model(language_code=result["language"], device=device)
# align whisper output
result_aligned = whisperx.align(result["segments"], model_a, metadata, audio_file, device)
print(result["segments"]) # before alignment
print(result_aligned["segments"]) # after alignment
print(result_aligned["word_segments"]) # word-level segments after alignment
```