diff --git a/cosyvoice/cli/model.py b/cosyvoice/cli/model.py
index b589bcd..9903acb 100644
--- a/cosyvoice/cli/model.py
+++ b/cosyvoice/cli/model.py
@@ -411,7 +411,7 @@ class CosyVoice3Model(CosyVoice2Model):
         self.llm_end_dict = {}
         self.hift_cache_dict = {}
         # FSQ silent token
-        self.silent_tokens = [28, 29]
+        self.silent_tokens = [2, 28, 29]
 
     def token2wav(self, token, prompt_token, prompt_feat, embedding, token_offset, uuid, stream=False, finalize=False, speed=1.0):
         with torch.cuda.amp.autocast(self.fp16):