From 45059246084a8a581c20e5b09dcda2c720da96b3 Mon Sep 17 00:00:00 2001 From: xxnuo <54252779+xxnuo@users.noreply.github.com> Date: Fri, 27 Jun 2025 14:43:57 +0800 Subject: [PATCH 1/6] Fix: Use wetext replace WeTextProcessing --- cosyvoice/cli/frontend.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/cosyvoice/cli/frontend.py b/cosyvoice/cli/frontend.py index 36dcd18..16ed551 100644 --- a/cosyvoice/cli/frontend.py +++ b/cosyvoice/cli/frontend.py @@ -28,9 +28,9 @@ try: import ttsfrd use_ttsfrd = True except ImportError: - print("failed to import ttsfrd, use WeTextProcessing instead") - from tn.chinese.normalizer import Normalizer as ZhNormalizer - from tn.english.normalizer import Normalizer as EnNormalizer + print("failed to import ttsfrd, use wetext instead") + from wetext import Normalizer as ZhNormalizer + from wetext import Normalizer as EnNormalizer use_ttsfrd = False from cosyvoice.utils.file_utils import logging from cosyvoice.utils.frontend_utils import contains_chinese, replace_blank, replace_corner_mark, remove_bracket, spell_out_number, split_paragraph, is_only_punctuation From ff9694dc2c224a781fb207210cb56d284781c5ea Mon Sep 17 00:00:00 2001 From: xxnuo <54252779+xxnuo@users.noreply.github.com> Date: Fri, 27 Jun 2025 14:45:07 +0800 Subject: [PATCH 2/6] Fix: Use wetext cache --- cosyvoice/cli/frontend.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cosyvoice/cli/frontend.py b/cosyvoice/cli/frontend.py index 16ed551..ec89b66 100644 --- a/cosyvoice/cli/frontend.py +++ b/cosyvoice/cli/frontend.py @@ -68,7 +68,7 @@ class CosyVoiceFrontEnd: 'failed to initialize ttsfrd resource' self.frd.set_lang_type('pinyinvg') else: - self.zh_tn_model = ZhNormalizer(remove_erhua=False, full_to_half=False, overwrite_cache=True) + self.zh_tn_model = ZhNormalizer(remove_erhua=False, full_to_half=False, overwrite_cache=False) self.en_tn_model = EnNormalizer() self.inflect_parser = inflect.engine() From c788bca1a631fd7b5b22dd8a88737b0d6142485d Mon Sep 17 00:00:00 2001 From: xxnuo <54252779+xxnuo@users.noreply.github.com> Date: Fri, 27 Jun 2025 14:50:35 +0800 Subject: [PATCH 3/6] Update requirements.txt --- requirements.txt | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/requirements.txt b/requirements.txt index fe48b20..782c1f7 100644 --- a/requirements.txt +++ b/requirements.txt @@ -36,5 +36,5 @@ torch==2.3.1 torchaudio==2.3.1 transformers==4.40.1 uvicorn==0.30.0 -WeTextProcessing==1.0.3 +wetext==0.0.4 wget==3.2 From 525531d8a3b76a4f6f0e70433e32ba233a29a0f9 Mon Sep 17 00:00:00 2001 From: xxnuo <54252779+xxnuo@users.noreply.github.com> Date: Fri, 27 Jun 2025 14:52:58 +0800 Subject: [PATCH 4/6] Update README.md --- README.md | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/README.md b/README.md index 2a2878a..870f853 100644 --- a/README.md +++ b/README.md @@ -69,8 +69,6 @@ ``` sh conda create -n cosyvoice -y python=3.10 conda activate cosyvoice - # pynini is required by WeTextProcessing, use conda to install it as it can be executed on all platforms. - conda install -y -c conda-forge pynini==2.1.5 pip install -r requirements.txt -i https://mirrors.aliyun.com/pypi/simple/ --trusted-host=mirrors.aliyun.com # If you encounter sox compatibility issues @@ -106,7 +104,7 @@ git clone https://www.modelscope.cn/iic/CosyVoice-ttsfrd.git pretrained_models/C Optionally, you can unzip `ttsfrd` resource and install `ttsfrd` package for better text normalization performance. -Notice that this step is not necessary. If you do not install `ttsfrd` package, we will use WeTextProcessing by default. +Notice that this step is not necessary. If you do not install `ttsfrd` package, we will use wetext by default. ``` sh cd pretrained_models/CosyVoice-ttsfrd/ From 6eaef42126b79c884a47a7fabd6f4f387d38c255 Mon Sep 17 00:00:00 2001 From: xxnuo <54252779+xxnuo@users.noreply.github.com> Date: Fri, 27 Jun 2025 15:55:00 +0800 Subject: [PATCH 5/6] Fix: remove full_to_half --- cosyvoice/cli/frontend.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cosyvoice/cli/frontend.py b/cosyvoice/cli/frontend.py index ec89b66..22daadd 100644 --- a/cosyvoice/cli/frontend.py +++ b/cosyvoice/cli/frontend.py @@ -68,7 +68,7 @@ class CosyVoiceFrontEnd: 'failed to initialize ttsfrd resource' self.frd.set_lang_type('pinyinvg') else: - self.zh_tn_model = ZhNormalizer(remove_erhua=False, full_to_half=False, overwrite_cache=False) + self.zh_tn_model = ZhNormalizer(remove_erhua=False, overwrite_cache=False) self.en_tn_model = EnNormalizer() self.inflect_parser = inflect.engine() From 116c99bf39e562d13b2fbc8cddde8137d6bdba15 Mon Sep 17 00:00:00 2001 From: xxnuo <54252779+xxnuo@users.noreply.github.com> Date: Fri, 27 Jun 2025 15:57:17 +0800 Subject: [PATCH 6/6] Fix: remove overwrite_cache --- cosyvoice/cli/frontend.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/cosyvoice/cli/frontend.py b/cosyvoice/cli/frontend.py index 22daadd..f98b0d6 100644 --- a/cosyvoice/cli/frontend.py +++ b/cosyvoice/cli/frontend.py @@ -68,7 +68,7 @@ class CosyVoiceFrontEnd: 'failed to initialize ttsfrd resource' self.frd.set_lang_type('pinyinvg') else: - self.zh_tn_model = ZhNormalizer(remove_erhua=False, overwrite_cache=False) + self.zh_tn_model = ZhNormalizer(remove_erhua=False) self.en_tn_model = EnNormalizer() self.inflect_parser = inflect.engine()