diff --git a/utils_vad.py b/utils_vad.py index eccf618..d80b798 100644 --- a/utils_vad.py +++ b/utils_vad.py @@ -239,7 +239,7 @@ def get_speech_timestamps(audio: torch.Tensor, triggered = False continue - if current_speech: + if current_speech and (audio_length_samples - current_speech['start']) > min_speech_samples: current_speech['end'] = audio_length_samples speeches.append(current_speech)