小程序在9月27日发布了正式版

This commit is contained in:
qcloud
2025-10-01 08:29:09 +08:00
parent 8d90798647
commit c44e6715a0
15 changed files with 6679 additions and 25074 deletions

View File

@@ -1091,6 +1091,7 @@ class QwenTTS:
self.synthesizer = None
self.callback = None
self.is_cosyvoice = False
self.is_cosyvoice_v2 = False
self.cosyvoice = ""
self.voice = ""
self.format = format
@@ -1103,6 +1104,9 @@ class QwenTTS:
self.is_cosyvoice = True
self.cosyvoice = parts[0]
self.voice = parts[1]
if parts[0] == 'cosyvoice-v2':
self.is_cosyvoice_v2 = True
logging.info(f"---begin--init QwenTTS-- {format} {sample_rate} {model_name} {self.cosyvoice} {self.voice}") # cyx
self.completion_event = None # 新增:用于通知任务完成
# 特殊字符及其拼音映射
@@ -1292,6 +1296,12 @@ class QwenTTS:
"""
在文本中查找特殊字符并用<phoneme>标签包裹它们
"""
"""
SSML(Speech Synthesis Markup Language)是一种基于 XML 的语音合成标记语言。
它不仅能让语音合成大模型读出更丰富的文本内容,还支持对语速、语调、停顿、音量等语音特征进行精细控制,
甚至可以添加背景音乐,带来更具表现力的语音效果。本文介绍 CosyVoice 的 SSML 功能及使用。
注意:SSML 功能仅限 cosyvoice-v2 模型使用。
"""
# 如果文本已经是SSML格式直接返回
if text.strip().startswith("<speak>") and text.strip().endswith("</speak>"):
return text
@@ -1311,7 +1321,9 @@ class QwenTTS:
return f"<speak>{text}</speak>"
def text_tts_call(self, text):
if self.special_characters :
# SSML(Speech Synthesis Markup Language)是一种基于 XML 的语音合成标记语言。
# SSML 功能仅限 cosyvoice-v2 模型使用。
if self.special_characters and self.is_cosyvoice_v2 :
text = self.apply_phoneme_tags(text)
#logging.info(f"Applied SSML phoneme tags to text: {text}")
volume = 50