fix: end of chunk may exceed audio length

This commit is contained in:
adamnsandle
2022-06-02 10:39:16 +00:00
parent bf0127e016
commit 8eba346bc9

View File

@@ -252,8 +252,8 @@ def get_speech_timestamps(audio: torch.Tensor,
speech['end'] += int(silence_duration // 2)
speeches[i+1]['start'] = int(max(0, speeches[i+1]['start'] - silence_duration // 2))
else:
speech['end'] += int(speech_pad_samples)
speeches[i+1]['start'] -= int(speech_pad_samples)
speech['end'] = int(min(audio_length_samples, speech['end'] + speech_pad_samples))
speeches[i+1]['start'] = int(max(0, speeches[i+1]['start'] - speech_pad_samples))
else:
speech['end'] = int(min(audio_length_samples, speech['end'] + speech_pad_samples))