diff --git a/dsRag/Test/T2_read_word_content.py b/dsRag/Test/T2_read_word_content.py
index 0e32002b..d8281e8f 100644
--- a/dsRag/Test/T2_read_word_content.py
+++ b/dsRag/Test/T2_read_word_content.py
@@ -63,4 +63,13 @@ if __name__ == "__main__":
     res = read_word_content(word_document_path)
     q = split_into_blocks(res)
     for x in q:
-        print(x[1])
+        print("===段落开始:===")
+        # Split at the first newline rather than slicing by the stripped
+        # heading's length: with leading whitespace on the first line that
+        # length is too short and the heading's tail leaks into the content.
+        heading, _, remainder = x[1].partition("\n")
+        firstLine = heading.strip()
+        content = remainder.strip()
+        print("firstLine=" + firstLine)
+        print("content=" + content)
+        print("===段落结束:===\n")