diff --git a/cosyvoice/utils/file_utils.py b/cosyvoice/utils/file_utils.py index 7700a9f..d4179e1 100644 --- a/cosyvoice/utils/file_utils.py +++ b/cosyvoice/utils/file_utils.py @@ -40,14 +40,14 @@ def load_wav(wav, target_sr): speech = torchaudio.transforms.Resample(orig_freq=sample_rate, new_freq=target_sr)(speech) return speech -def speed_change(waveform,sample_rate,speed_factor:str): +def speed_change(waveform, sample_rate, speed_factor: str): effects = [ - ["tempo",speed_factor], # speed_factor - ["rate", f"{sample_rate}"] + ["tempo", speed_factor], # speed_factor + ["rate", f"{sample_rate}"] ] augmented_waveform, new_sample_rate = torchaudio.sox_effects.apply_effects_tensor( - waveform, - sample_rate, + waveform, + sample_rate, effects ) return augmented_waveform, new_sample_rate