From 08f027a52050c80983973dda6e869da5dc3902a1 Mon Sep 17 00:00:00 2001
From: HuangHai <10402852@qq.com>
Date: Wed, 16 Apr 2025 08:36:36 +0800
Subject: [PATCH] 'commit'

---
 .../core/handle/receiveAudioHandle.py | 1 +
 XiaoZhi/文档/技术文档分析.txt | 15 ++++++++++++++-
 2 files changed, 15 insertions(+), 1 deletion(-)

diff --git a/XiaoZhi/xiaozhi-esp32-server/main/xiaozhi-server/core/handle/receiveAudioHandle.py b/XiaoZhi/xiaozhi-esp32-server/main/xiaozhi-server/core/handle/receiveAudioHandle.py
index f798739a..7a2a47b2 100644
--- a/XiaoZhi/xiaozhi-esp32-server/main/xiaozhi-server/core/handle/receiveAudioHandle.py
+++ b/XiaoZhi/xiaozhi-esp32-server/main/xiaozhi-server/core/handle/receiveAudioHandle.py
@@ -35,6 +35,7 @@ async def handleAudioMessage(conn, audio):
         if len(conn.asr_audio) < 15:
             conn.asr_server_receive = True
         else:
+            logger.bind(tag=TAG).info(f"==========开始识别==============")
             text, file_path = await conn.asr.speech_to_text(
                 conn.asr_audio, conn.session_id
             )
diff --git a/XiaoZhi/文档/技术文档分析.txt b/XiaoZhi/文档/技术文档分析.txt
index 588726a2..5e3e6405 100644
--- a/XiaoZhi/文档/技术文档分析.txt
+++ b/XiaoZhi/文档/技术文档分析.txt
@@ -1,5 +1,11 @@
 1、ASR
 D:\dsWork\QingLong\XiaoZhi\xiaozhi-esp32-server\main\xiaozhi-server\core\handle\receiveAudioHandle.py
+
+在第12行,大约这个位置下断点,可以跟踪到流程
+async def handleAudioMessage(conn, audio):
+    if not conn.asr_server_receive:
+
+某些场景下,在38行下断点可以拦截到内容
     if conn.client_voice_stop:
         conn.client_abort = False
         conn.asr_server_receive = False
@@ -10,4 +16,11 @@ D:\dsWork\QingLong\XiaoZhi\xiaozhi-esp32-server\main\xiaozhi-server\core\handle\
             text, file_path = await conn.asr.speech_to_text(
                 conn.asr_audio, conn.session_id
             )
-约第38行
+
+跟踪进入
+D:\dsWork\QingLong\XiaoZhi\xiaozhi-esp32-server\main\xiaozhi-server\core\providers\asr\fun_local.py
+76行
+    async def speech_to_text(self, opus_data: List[bytes], session_id: str) -> Tuple[Optional[str], Optional[str]]:
+        """语音转文本主处理逻辑"""
+        file_path = None
+        try: