From bf0127e01673d845d0760e912713ed2876b8748d Mon Sep 17 00:00:00 2001 From: adamnsandle Date: Thu, 2 Jun 2022 10:32:32 +0000 Subject: [PATCH] fx get_speech ts start of an audio chunk pad --- utils_vad.py | 1 + 1 file changed, 1 insertion(+) diff --git a/utils_vad.py b/utils_vad.py index d80b798..b390cf6 100644 --- a/utils_vad.py +++ b/utils_vad.py @@ -253,6 +253,7 @@ def get_speech_timestamps(audio: torch.Tensor, speeches[i+1]['start'] = int(max(0, speeches[i+1]['start'] - silence_duration // 2)) else: speech['end'] += int(speech_pad_samples) + speeches[i+1]['start'] -= int(speech_pad_samples) else: speech['end'] = int(min(audio_length_samples, speech['end'] + speech_pad_samples))