From 88c27d7b99f5f8d06d88daa7971a56ac6ebbc0ed Mon Sep 17 00:00:00 2001 From: boocmp Date: Mon, 19 Aug 2024 14:59:51 +0700 Subject: [PATCH] wav2vec2 backend + padding. --- src/runners/audio_transcriber.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/runners/audio_transcriber.py b/src/runners/audio_transcriber.py index fa6d7b5..ce75782 100644 --- a/src/runners/audio_transcriber.py +++ b/src/runners/audio_transcriber.py @@ -187,7 +187,7 @@ def __init__(self): def transcribe(self, audios): input_values = self.processor( - audios, return_tensors="pt", sampling_rate=16000 + audios, return_tensors="pt", sampling_rate=16000, padding=True ).input_values.cuda() with torch.no_grad():