From e4bcce494627f746f37e8adaf209ed72557acfc7 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?=E6=9C=B1=E6=BD=AE?= Date: Fri, 19 Sep 2025 20:44:35 +0800 Subject: [PATCH] fix audio --- doubao/audio_manager.py | 4 ++-- doubao/config.py | 6 ++---- 2 files changed, 4 insertions(+), 6 deletions(-) diff --git a/doubao/audio_manager.py b/doubao/audio_manager.py index 7ed689d..9af8800 100644 --- a/doubao/audio_manager.py +++ b/doubao/audio_manager.py @@ -20,7 +20,7 @@ from realtime_dialog_client import RealtimeDialogClient class AudioConfig: """音频配置数据类""" format: str - bit_size: int + bit_size: str # 改为字符串类型 channels: int sample_rate: int chunk: int @@ -115,7 +115,7 @@ class DialogSession: output_audio_format=output_audio_format, mod=mod, recv_timeout=recv_timeout) if output_audio_format == "pcm_s16le": config.output_audio_config["format"] = "pcm_s16le" - config.output_audio_config["bit_size"] = pyaudio.paInt16 + config.output_audio_config["bit_size"] = "int16" # 使用字符串标识符 self.is_running = True self.is_session_finished = False diff --git a/doubao/config.py b/doubao/config.py index 3bb6cd1..c388772 100644 --- a/doubao/config.py +++ b/doubao/config.py @@ -1,7 +1,5 @@ import uuid -import pyaudio - # 配置信息 ws_connect_config = { "base_url": "wss://openspeech.bytedance.com/api/v3/realtime/dialogue", @@ -48,7 +46,7 @@ input_audio_config = { "format": "pcm", "channels": 1, "sample_rate": 16000, - "bit_size": pyaudio.paInt16, + "bit_size": "int16", } output_audio_config = { @@ -56,5 +54,5 @@ output_audio_config = { "format": "pcm", "channels": 1, "sample_rate": 24000, - "bit_size": pyaudio.paInt16, + "bit_size": "int16", }