From f21c4764ecb04cd5108252802c568f452fe2d576 Mon Sep 17 00:00:00 2001
From: "lyuxiang.lx" <lyuxiang.lx@alibaba-inc.com>
Date: Thu, 11 Dec 2025 06:04:36 +0000
Subject: [PATCH] fix <|endofprompt|> token in instruct_list and drop .item() on sampling_ids result

---
 cosyvoice/llm/llm.py      |  2 +-
 cosyvoice/utils/common.py | 52 +++++++++++++++++++--------------------
 2 files changed, 27 insertions(+), 27 deletions(-)
diff --git a/cosyvoice/llm/llm.py b/cosyvoice/llm/llm.py
index a343ce4..6b3a7b0 100644
--- a/cosyvoice/llm/llm.py
+++ b/cosyvoice/llm/llm.py
@@ -604,7 +604,7 @@ class Qwen2LM(TransformerLM):
                                                       masks=torch.tril(torch.ones((1, seq_len, seq_len), device=lm_input.device)).to(torch.bool),
                                                       cache=cache)
             logp = self.llm_decoder(y_pred[:, -1]).log_softmax(dim=-1)
-            top_ids = self.sampling_ids(logp.squeeze(dim=0), out_tokens, sampling, ignore_eos=False).item()
+            top_ids = self.sampling_ids(logp.squeeze(dim=0), out_tokens, sampling, ignore_eos=False)
             out_tokens.append(top_ids)
             if top_ids >= self.speech_token_size:
                 if top_ids == self.eos_token:
diff --git a/cosyvoice/utils/common.py b/cosyvoice/utils/common.py
index 8afe308..5d307ae 100644
--- a/cosyvoice/utils/common.py
+++ b/cosyvoice/utils/common.py
@@ -25,32 +25,32 @@ import torch
 
 IGNORE_ID = -1
 
-instruct_list = ["You are a helpful assistant. 请用广东话表达。<endofprompt>",
-                 "You are a helpful assistant. 请用东北话表达。<endofprompt>",
-                 "You are a helpful assistant. 请用甘肃话表达。<endofprompt>",
-                 "You are a helpful assistant. 请用贵州话表达。<endofprompt>",
-                 "You are a helpful assistant. 请用河南话表达。<endofprompt>",
-                 "You are a helpful assistant. 请用湖北话表达。<endofprompt>",
-                 "You are a helpful assistant. 请用湖南话表达。<endofprompt>",
-                 "You are a helpful assistant. 请用江西话表达。<endofprompt>",
-                 "You are a helpful assistant. 请用闽南话表达。<endofprompt>",
-                 "You are a helpful assistant. 请用宁夏话表达。<endofprompt>",
-                 "You are a helpful assistant. 请用山西话表达。<endofprompt>",
-                 "You are a helpful assistant. 请用陕西话表达。<endofprompt>",
-                 "You are a helpful assistant. 请用山东话表达。<endofprompt>",
-                 "You are a helpful assistant. 请用上海话表达。<endofprompt>",
-                 "You are a helpful assistant. 请用四川话表达。<endofprompt>",
-                 "You are a helpful assistant. 请用天津话表达。<endofprompt>",
-                 "You are a helpful assistant. 请用云南话表达。<endofprompt>",
-                 "You are a helpful assistant. Please say a sentence as loudly as possible.<endofprompt>",
-                 "You are a helpful assistant. Please say a sentence in a very soft voice.<endofprompt>",
-                 "You are a helpful assistant. 请用尽可能慢地语速说一句话。<endofprompt>",
-                 "You are a helpful assistant. 请用尽可能快地语速说一句话。<endofprompt>",
-                 "You are a helpful assistant. 请非常开心地说一句话。<endofprompt>",
-                 "You are a helpful assistant. 请非常伤心地说一句话。<endofprompt>",
-                 "You are a helpful assistant. 请非常生气地说一句话。<endofprompt>",
-                 "You are a helpful assistant. 我想体验一下小猪佩奇风格，可以吗？<endofprompt>",
-                 "You are a helpful assistant. 你可以尝试用机器人的方式解答吗？<endofprompt>"]
+instruct_list = ["You are a helpful assistant. 请用广东话表达。<|endofprompt|>",
+                 "You are a helpful assistant. 请用东北话表达。<|endofprompt|>",
+                 "You are a helpful assistant. 请用甘肃话表达。<|endofprompt|>",
+                 "You are a helpful assistant. 请用贵州话表达。<|endofprompt|>",
+                 "You are a helpful assistant. 请用河南话表达。<|endofprompt|>",
+                 "You are a helpful assistant. 请用湖北话表达。<|endofprompt|>",
+                 "You are a helpful assistant. 请用湖南话表达。<|endofprompt|>",
+                 "You are a helpful assistant. 请用江西话表达。<|endofprompt|>",
+                 "You are a helpful assistant. 请用闽南话表达。<|endofprompt|>",
+                 "You are a helpful assistant. 请用宁夏话表达。<|endofprompt|>",
+                 "You are a helpful assistant. 请用山西话表达。<|endofprompt|>",
+                 "You are a helpful assistant. 请用陕西话表达。<|endofprompt|>",
+                 "You are a helpful assistant. 请用山东话表达。<|endofprompt|>",
+                 "You are a helpful assistant. 请用上海话表达。<|endofprompt|>",
+                 "You are a helpful assistant. 请用四川话表达。<|endofprompt|>",
+                 "You are a helpful assistant. 请用天津话表达。<|endofprompt|>",
+                 "You are a helpful assistant. 请用云南话表达。<|endofprompt|>",
+                 "You are a helpful assistant. Please say a sentence as loudly as possible.<|endofprompt|>",
+                 "You are a helpful assistant. Please say a sentence in a very soft voice.<|endofprompt|>",
+                 "You are a helpful assistant. 请用尽可能慢地语速说一句话。<|endofprompt|>",
+                 "You are a helpful assistant. 请用尽可能快地语速说一句话。<|endofprompt|>",
+                 "You are a helpful assistant. 请非常开心地说一句话。<|endofprompt|>",
+                 "You are a helpful assistant. 请非常伤心地说一句话。<|endofprompt|>",
+                 "You are a helpful assistant. 请非常生气地说一句话。<|endofprompt|>",
+                 "You are a helpful assistant. 我想体验一下小猪佩奇风格，可以吗？<|endofprompt|>",
+                 "You are a helpful assistant. 你可以尝试用机器人的方式解答吗？<|endofprompt|>"]
 
 
 def pad_list(xs: List[torch.Tensor], pad_value: int):