Add `--disable-echo-cancellation` CLI option and update the audio pipeline so that passing it turns echo cancellation off and VAD on (by default echo cancellation stays on and VAD stays off)

Files changed (3)

main.py CHANGED Viewed

@@ -79,7 +79,7 @@ VoiceDialogue - 语音对话系统
             print(f"语言设置: {args.language}")
             print(f"说话人: {args.speaker}")
             print("正在启动命令行语音对话系统...")
-            launch_system(args.language, args.speaker)
         elif args.mode == 'api':
             launch_api_server(

             print(f"语言设置: {args.language}")
             print(f"说话人: {args.speaker}")
             print("正在启动命令行语音对话系统...")
+            launch_system(args.language, args.speaker, args.disable_echo_cancellation)
         elif args.mode == 'api':
             launch_api_server(

src/voice_dialogue/cli/args.py CHANGED Viewed

@@ -68,6 +68,12 @@ def create_argument_parser():
         default='沈逸' if '沈逸' in available_speakers else (available_speakers[0] if available_speakers else '沈逸'),
         help='TTS说话人 (默认: 沈逸)'
     )
     # API服务器模式参数
     api_group = parser.add_argument_group('API服务器模式参数')

         default='沈逸' if '沈逸' in available_speakers else (available_speakers[0] if available_speakers else '沈逸'),
         help='TTS说话人 (默认: 沈逸)'
     )
+    cli_group.add_argument(
+        '--disable-echo-cancellation',
+        action='store_true',
+        default=False,
+        help='禁用回声消除功能 (默认: 启用)'
+    )
     # API服务器模式参数
     api_group = parser.add_argument_group('API服务器模式参数')

src/voice_dialogue/core/launcher.py CHANGED Viewed

@@ -25,7 +25,8 @@ from voice_dialogue.utils.logger import logger
 def launch_system(
         user_language: str,
-        speaker: str
 ) -> None:
     """
     启动完整的语音对话系统
@@ -61,14 +62,22 @@ def launch_system(
     threads = []
     # 音频采集
-    audio_frame_probe = AudioCapture(audio_frames_queue=audio_frames_queue)
     audio_frame_probe.start()
     threads.append(audio_frame_probe)
     # 语音状态监测
     user_voice_checker = SpeechStateMonitor(
         audio_frame_queue=audio_frames_queue,
         user_voice_queue=user_voice_queue,
     )
     user_voice_checker.start()
     threads.append(user_voice_checker)

 def launch_system(
         user_language: str,
+        speaker: str,
+        disable_echo_cancellation: bool = False,
 ) -> None:
     """
     启动完整的语音对话系统
     threads = []
     # 音频采集
+    enable_echo_cancellation = not disable_echo_cancellation
+    logger.info(f"Echo Cancellation: {enable_echo_cancellation}")
+    audio_frame_probe = AudioCapture(
+        audio_frames_queue=audio_frames_queue,
+        enable_echo_cancellation=enable_echo_cancellation
+    )
     audio_frame_probe.start()
     threads.append(audio_frame_probe)
     # 语音状态监测
+    enable_vad = disable_echo_cancellation
+    logger.info(f"VAD: {enable_vad}")
     user_voice_checker = SpeechStateMonitor(
         audio_frame_queue=audio_frames_queue,
         user_voice_queue=user_voice_queue,
+        enable_vad=enable_vad
     )
     user_voice_checker.start()
     threads.append(user_voice_checker)