diff --git a/dsLightRag/KeDaXunFei/XunFeiAudioEvaluator.py b/dsLightRag/KeDaXunFei/XunFeiAudioEvaluator.py index 0010199e..083cf7c8 100644 --- a/dsLightRag/KeDaXunFei/XunFeiAudioEvaluator.py +++ b/dsLightRag/KeDaXunFei/XunFeiAudioEvaluator.py @@ -274,9 +274,10 @@ if __name__ == '__main__': api_secret = XF_APISECRET api_key = XF_APIKEY # audio_file = "./1.mp3" - audio_file = r'D:\dsWork\dsProject\dsLightRag\static\audio\audio_1f0a8c47db2d4f9ba7674055a352cab8.wav' + audio_file = r'D:\dsWork\dsProject\dsLightRag\static\audio\audio_afc0a96e382c428cba2f00e3f71e4e8f.mp3' # 创建评测器实例 - evaluator = XunFeiAudioEvaluator(appid, api_key, api_secret, audio_file, "english","nice to meet you.") + txt="Hello everyone! Nice to meet you. Today is a beautiful day. I am learning English pronunciation with this tool." + evaluator = XunFeiAudioEvaluator(appid, api_key, api_secret, audio_file, "english",txt) # 运行评测 results, eval_time = evaluator.run_evaluation() diff --git a/dsLightRag/KeDaXunFei/__pycache__/XunFeiAudioEvaluator.cpython-310.pyc b/dsLightRag/KeDaXunFei/__pycache__/XunFeiAudioEvaluator.cpython-310.pyc index 159a75fe..d4b7efa0 100644 Binary files a/dsLightRag/KeDaXunFei/__pycache__/XunFeiAudioEvaluator.cpython-310.pyc and b/dsLightRag/KeDaXunFei/__pycache__/XunFeiAudioEvaluator.cpython-310.pyc differ diff --git a/dsLightRag/Routes/XunFeiRoute.py b/dsLightRag/Routes/XunFeiRoute.py index ae09e991..bf4cead5 100644 --- a/dsLightRag/Routes/XunFeiRoute.py +++ b/dsLightRag/Routes/XunFeiRoute.py @@ -37,13 +37,29 @@ async def save_audio(audio: UploadFile = File(...), txt: str = Form(...)): shutil.copy2(temp_file, file_path) logger.info(f"已保存文件到: {file_path}") + # 添加wav转mp3功能 + import subprocess + mp3_temp_file = os.path.join(temp_dir, f"temp_{uuid.uuid4().hex}.mp3") + try: + # 使用ffmpeg将wav转换为mp3 + subprocess.run( + ["ffmpeg", "-i", temp_file, "-y", mp3_temp_file], + check=True, + stdout=subprocess.PIPE, + stderr=subprocess.PIPE + ) + logger.info(f"已将wav转换为mp3: {mp3_temp_file}") + except subprocess.CalledProcessError as e: + logger.error(f"ffmpeg转换失败: {e.stderr.decode()}") + raise Exception(f"音频格式转换失败: {e.stderr.decode()}") + # 2. 讯飞评分 from KeDaXunFei.XunFeiAudioEvaluator import XunFeiAudioEvaluator evaluator = XunFeiAudioEvaluator( appid=XF_APPID, api_key=XF_APIKEY, api_secret=XF_APISECRET, - audio_file=temp_file, + audio_file=mp3_temp_file, # 使用转换后的mp3文件 language="english", txt=txt ) diff --git a/dsLightRag/Routes/__pycache__/XunFeiRoute.cpython-310.pyc b/dsLightRag/Routes/__pycache__/XunFeiRoute.cpython-310.pyc index fef601ed..e287f688 100644 Binary files a/dsLightRag/Routes/__pycache__/XunFeiRoute.cpython-310.pyc and b/dsLightRag/Routes/__pycache__/XunFeiRoute.cpython-310.pyc differ diff --git a/dsLightRag/static/XunFei/audio_evaluation.html b/dsLightRag/static/XunFei/audio_evaluation.html index 8272a3ab..d1d044d4 100644 --- a/dsLightRag/static/XunFei/audio_evaluation.html +++ b/dsLightRag/static/XunFei/audio_evaluation.html @@ -433,7 +433,7 @@

🎙️ 英语朗读评测

- +

📝 请朗读以下文本

diff --git a/dsLightRag/static/audio/audio_1013c986df5245f0bdf921aa5b198149.wav b/dsLightRag/static/audio/audio_1013c986df5245f0bdf921aa5b198149.wav deleted file mode 100644 index 555ca7f4..00000000 Binary files a/dsLightRag/static/audio/audio_1013c986df5245f0bdf921aa5b198149.wav and /dev/null differ diff --git a/dsLightRag/static/audio/audio_1e213f49b6f84f96a3adc8eaaac14d61.wav b/dsLightRag/static/audio/audio_1e213f49b6f84f96a3adc8eaaac14d61.wav new file mode 100644 index 00000000..38e9d5e5 Binary files /dev/null and b/dsLightRag/static/audio/audio_1e213f49b6f84f96a3adc8eaaac14d61.wav differ diff --git a/dsLightRag/static/audio/audio_1f0a8c47db2d4f9ba7674055a352cab8.wav b/dsLightRag/static/audio/audio_1f0a8c47db2d4f9ba7674055a352cab8.wav deleted file mode 100644 index c5545770..00000000 Binary files a/dsLightRag/static/audio/audio_1f0a8c47db2d4f9ba7674055a352cab8.wav and /dev/null differ diff --git a/dsLightRag/static/audio/audio_4bfaf83cdee94098813d77b79cacca8e.wav b/dsLightRag/static/audio/audio_4bfaf83cdee94098813d77b79cacca8e.wav deleted file mode 100644 index 5899a277..00000000 Binary files a/dsLightRag/static/audio/audio_4bfaf83cdee94098813d77b79cacca8e.wav and /dev/null differ diff --git a/dsLightRag/static/audio/audio_76c396992ca94dd4b94250ac67e31820.wav b/dsLightRag/static/audio/audio_76c396992ca94dd4b94250ac67e31820.wav deleted file mode 100644 index 129e0eee..00000000 Binary files a/dsLightRag/static/audio/audio_76c396992ca94dd4b94250ac67e31820.wav and /dev/null differ diff --git a/dsLightRag/static/audio/audio_8357cf7e4b754d118232f3bd08239ad4.wav b/dsLightRag/static/audio/audio_8357cf7e4b754d118232f3bd08239ad4.wav deleted file mode 100644 index 0385d9e9..00000000 Binary files a/dsLightRag/static/audio/audio_8357cf7e4b754d118232f3bd08239ad4.wav and /dev/null differ diff --git a/dsLightRag/static/audio/audio_afc0a96e382c428cba2f00e3f71e4e8f.mp3 b/dsLightRag/static/audio/audio_afc0a96e382c428cba2f00e3f71e4e8f.mp3 new file mode 100644 index 00000000..dbc75607 Binary files /dev/null and b/dsLightRag/static/audio/audio_afc0a96e382c428cba2f00e3f71e4e8f.mp3 differ diff --git a/dsLightRag/static/audio/audio_afc0a96e382c428cba2f00e3f71e4e8f.wav b/dsLightRag/static/audio/audio_afc0a96e382c428cba2f00e3f71e4e8f.wav new file mode 100644 index 00000000..31ccb18a Binary files /dev/null and b/dsLightRag/static/audio/audio_afc0a96e382c428cba2f00e3f71e4e8f.wav differ diff --git a/dsLightRag/static/audio/audio_b54f70d60c784047be1a918904498905.wav b/dsLightRag/static/audio/audio_b54f70d60c784047be1a918904498905.wav deleted file mode 100644 index 8d83b140..00000000 Binary files a/dsLightRag/static/audio/audio_b54f70d60c784047be1a918904498905.wav and /dev/null differ diff --git a/dsLightRag/static/audio/audio_e059db87ae8f4979b6dfea90766ee10d.wav b/dsLightRag/static/audio/audio_e059db87ae8f4979b6dfea90766ee10d.wav deleted file mode 100644 index 9b9bb852..00000000 Binary files a/dsLightRag/static/audio/audio_e059db87ae8f4979b6dfea90766ee10d.wav and /dev/null differ diff --git a/dsLightRag/static/audio/audio_e36d2c22f1a64661ac1644304df7c732.wav b/dsLightRag/static/audio/audio_e36d2c22f1a64661ac1644304df7c732.wav deleted file mode 100644 index a99d0777..00000000 Binary files a/dsLightRag/static/audio/audio_e36d2c22f1a64661ac1644304df7c732.wav and /dev/null differ diff --git a/dsLightRag/static/audio/audio_fb4201ccadc94320a8fd820b0357ad35.wav b/dsLightRag/static/audio/audio_fb4201ccadc94320a8fd820b0357ad35.wav deleted file mode 100644 index 9876e7de..00000000 Binary files a/dsLightRag/static/audio/audio_fb4201ccadc94320a8fd820b0357ad35.wav and /dev/null differ diff --git a/dsLightRag/static/audio/eval_audio_0b3f382e-865a-487c-ac18-e8d6ecaca28d.wav b/dsLightRag/static/audio/eval_audio_0b3f382e-865a-487c-ac18-e8d6ecaca28d.wav deleted file mode 100644 index d26b87bd..00000000 Binary files a/dsLightRag/static/audio/eval_audio_0b3f382e-865a-487c-ac18-e8d6ecaca28d.wav and /dev/null differ diff --git a/dsLightRag/static/audio/eval_audio_777ae5af-d41f-4cf2-ab72-91204622626f.wav b/dsLightRag/static/audio/eval_audio_777ae5af-d41f-4cf2-ab72-91204622626f.wav deleted file mode 100644 index d26b87bd..00000000 Binary files a/dsLightRag/static/audio/eval_audio_777ae5af-d41f-4cf2-ab72-91204622626f.wav and /dev/null differ diff --git a/dsLightRag/static/audio/tts_20250902_073958_bd36e456.mp3 b/dsLightRag/static/audio/tts_20250902_073958_bd36e456.mp3 deleted file mode 100644 index 7c91656a..00000000 Binary files a/dsLightRag/static/audio/tts_20250902_073958_bd36e456.mp3 and /dev/null differ diff --git a/dsLightRag/static/audio/tts_20250902_074150_a7eb0d9a.mp3 b/dsLightRag/static/audio/tts_20250902_074150_a7eb0d9a.mp3 deleted file mode 100644 index f48c6b5f..00000000 Binary files a/dsLightRag/static/audio/tts_20250902_074150_a7eb0d9a.mp3 and /dev/null differ diff --git a/dsLightRag/static/audio/tts_20250902_074443_0df4889a.mp3 b/dsLightRag/static/audio/tts_20250902_074443_0df4889a.mp3 deleted file mode 100644 index 63bf21c2..00000000 Binary files a/dsLightRag/static/audio/tts_20250902_074443_0df4889a.mp3 and /dev/null differ diff --git a/dsLightRag/static/audio/tts_20250902_074755_81ca2382.mp3 b/dsLightRag/static/audio/tts_20250902_074755_81ca2382.mp3 deleted file mode 100644 index abd4d984..00000000 Binary files a/dsLightRag/static/audio/tts_20250902_074755_81ca2382.mp3 and /dev/null differ diff --git a/dsLightRag/static/audio/tts_20250902_075228_90ccd2a8.mp3 b/dsLightRag/static/audio/tts_20250902_075228_90ccd2a8.mp3 deleted file mode 100644 index 86edace8..00000000 Binary files a/dsLightRag/static/audio/tts_20250902_075228_90ccd2a8.mp3 and /dev/null differ