mirror of
https://github.com/FunAudioLLM/CosyVoice.git
synced 2026-02-05 18:09:24 +08:00
add prompt constraint
This commit is contained in:
@@ -78,6 +78,7 @@ class CosyVoiceFrontEnd:
|
|||||||
return text_token, text_token_len
|
return text_token, text_token_len
|
||||||
|
|
||||||
def _extract_speech_token(self, speech):
|
def _extract_speech_token(self, speech):
|
||||||
|
assert speech.shape[1] / 16000 <= 30, 'do not support extract speech token for audio longer than 30s'
|
||||||
feat = whisper.log_mel_spectrogram(speech, n_mels=128)
|
feat = whisper.log_mel_spectrogram(speech, n_mels=128)
|
||||||
speech_token = self.speech_tokenizer_session.run(None,
|
speech_token = self.speech_tokenizer_session.run(None,
|
||||||
{self.speech_tokenizer_session.get_inputs()[0].name:
|
{self.speech_tokenizer_session.get_inputs()[0].name:
|
||||||
|
|||||||
Reference in New Issue
Block a user