|
|
|
@ -3,7 +3,7 @@ import subprocess
|
|
|
|
|
import uuid
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def get_docx_content_by_pandoc(docx_file, output_file=None, extract_media=None):
|
|
|
|
|
def get_docx_content_by_pandoc(docx_file, output_file=None, parent_dir=None):
|
|
|
|
|
# 最后拼接的内容
|
|
|
|
|
content = ""
|
|
|
|
|
# output_file 设置为临时目录下的uuid.md
|
|
|
|
@ -11,10 +11,16 @@ def get_docx_content_by_pandoc(docx_file, output_file=None, extract_media=None):
|
|
|
|
|
# 将docx_file去掉扩展名
|
|
|
|
|
prefix = docx_file.split(".")[0].split("/")[-1]
|
|
|
|
|
temp_markdown = os.path.join('./static/markdown/', prefix + '.md')
|
|
|
|
|
if parent_dir:
|
|
|
|
|
temp_markdown = os.path.join('../static/markdown/', prefix + '.md')
|
|
|
|
|
# 调用pandoc将docx文件转换成markdown
|
|
|
|
|
if extract_media is None:
|
|
|
|
|
if parent_dir is None:
|
|
|
|
|
os.mkdir("./static/Images/" + file_name)
|
|
|
|
|
extract_media = "./static/Images/"
|
|
|
|
|
else:
|
|
|
|
|
os.mkdir("../static/Images/" + file_name)
|
|
|
|
|
extract_media = "../static/Images/"
|
|
|
|
|
|
|
|
|
|
subprocess.run(['pandoc', docx_file, '-f', 'docx', '-t', 'markdown', '-o', temp_markdown,
|
|
|
|
|
'--extract-media=' + extract_media + file_name])
|
|
|
|
|
# 读取然后修改内容,输出到新的文件
|
|
|
|
|