Local-Voice/doubao/config.py
2025-09-19 20:04:09 +08:00

67 lines
3.3 KiB
Python
Raw Blame History

This file contains ambiguous Unicode characters

This file contains Unicode characters that might be confused with other characters. If you think that this is intentional, you can safely ignore this warning. Use the Escape button to reveal them.

import os
import uuid

import pyaudio
# Configuration
# Audio format/playback preference flags. They are plain booleans here; the
# code that interprets them lives outside this file.
audio_config = dict(
    prefer_native_format=True,  # prefer the platform's native format
    fallback_to_int16=True,  # fall back to Int16 when Float32 is unsupported
    enable_aplay_fallback=True,  # allow aplay as an alternative playback path
)
# WebSocket connection settings: endpoint URL plus the request headers.
#
# NOTE(review): the App ID and Access Key were committed in plain text. They
# can be overridden with the DOUBAO_APP_ID / DOUBAO_ACCESS_KEY environment
# variables; the committed values are kept only as backward-compatible
# defaults and should be rotated and removed from source control.
#
# NOTE(review): X-Api-Connect-Id is generated once, when this module is
# imported, so every use of this dict within one process sees the same ID
# unless the caller replaces it.
ws_connect_config = {
    "base_url": "wss://openspeech.bytedance.com/api/v3/realtime/dialogue",
    "headers": {
        # `or` (rather than a .get default) also covers a variable that is
        # set but empty.
        "X-Api-App-ID": os.environ.get("DOUBAO_APP_ID") or "8718217928",
        "X-Api-Access-Key": (
            os.environ.get("DOUBAO_ACCESS_KEY")
            or "ynJMX-5ix1FsJvswC9KTNlGUdubcchqc"
        ),
        "X-Api-Resource-Id": "volc.speech.dialog",  # fixed value
        "X-Api-App-Key": "PlgvMymc7f3tQnJ6",  # fixed value
        "X-Api-Connect-Id": str(uuid.uuid4()),
    },
}
# Session-start request payload, grouped into "asr", "tts" and "dialog"
# sections.
start_session_req = dict(
    asr=dict(
        extra=dict(end_smooth_window_ms=1500),
    ),
    tts=dict(
        # Alternative speakers noted by the original author:
        #   "S_XXXXXX" - a custom cloned voice; dialog.character_manifest
        #       must then be filled in.
        #   "ICL_zh_female_aojiaonvyou_tob" - an official cloned voice; no
        #       character_manifest is needed.
        speaker="zh_female_vv_jupiter_bigtts",
        audio_config=dict(channel=1, format="pcm", sample_rate=24000),
    ),
    dialog=dict(
        bot_name="豆包",
        system_role="你使用活泼灵动的女声,性格开朗,热爱生活。",
        speaking_style="你的说话风格简洁明了,语速适中,语调自然。",
        # An optional "character_manifest" entry was left disabled here. The
        # sample was a free-text persona with three sections: appearance and
        # clothing, personality traits, and common expressions/catchphrases.
        location=dict(city="北京"),
        extra=dict(
            strict_audit=False,
            audit_response="支持客户自定义安全审核回复话术。",
            recv_timeout=10,
            input_mod="audio",
        ),
    ),
)
# Input-side audio parameters. "bit_size" holds the PyAudio sample-format
# constant paInt16.
input_audio_config = dict(
    chunk=3200,
    format="pcm",
    channels=1,
    sample_rate=16000,
    bit_size=pyaudio.paInt16,
)
# Output-side audio parameters. The sample rate (24000) matches the
# "sample_rate" requested in start_session_req["tts"]["audio_config"].
output_audio_config = dict(
    chunk=4096,  # enlarged buffer size
    format="pcm",
    channels=1,
    sample_rate=24000,
    bit_size=pyaudio.paFloat32,  # the server returns Float32 samples
)