diff --git a/utils_vad.py b/utils_vad.py index 72e91e6..d80b798 100644 --- a/utils_vad.py +++ b/utils_vad.py @@ -239,10 +239,9 @@ def get_speech_timestamps(audio: torch.Tensor, triggered = False continue - if current_speech: - if (audio_length_samples - current_speech['start']) > min_speech_samples: - current_speech['end'] = audio_length_samples - speeches.append(current_speech) + if current_speech and (audio_length_samples - current_speech['start']) > min_speech_samples: + current_speech['end'] = audio_length_samples + speeches.append(current_speech) for i, speech in enumerate(speeches): if i == 0: