From d9af5f2a2aa5c0d76f154389718050aacb1c341f Mon Sep 17 00:00:00 2001 From: HuangHai <10402852@qq.com> Date: Thu, 26 Jun 2025 10:20:46 +0800 Subject: [PATCH] 'commit' --- dsRag/Test/T12.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/dsRag/Test/T12.py b/dsRag/Test/T12.py index 736853c2..61aee319 100644 --- a/dsRag/Test/T12.py +++ b/dsRag/Test/T12.py @@ -4,6 +4,8 @@ pip install faiss-cpu import re from Util.SplitDocxUtil import SplitDocxUtil +# 源文件 +input_file = '../Txt/小学数学(史校长).docx' def split_into_blocks(text): """使用正则表达式匹配问题和话题的标题及内容""" @@ -12,12 +14,10 @@ def split_into_blocks(text): return [(i + 1, title + content) for i, (title, content) in enumerate(blocks)] -# 源文件 -input_file = '../Txt/小学数学(史校长).docx' """处理文档主函数""" text = SplitDocxUtil.read_docx(input_file) - +# 切开块 blocks = split_into_blocks(text) # 将块编码并添加到向量数据库