You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

43 lines
2.0 KiB

This file contains ambiguous Unicode characters!

This file contains ambiguous Unicode characters that may be confused with others in your current locale. If your use case is intentional and legitimate, you can safely ignore this warning. Use the Escape button to highlight these characters.

import os
from openai import OpenAI
# Name of the environment variable that holds the DashScope (Bailian) API key.
# The key is read from the environment so that no secret is committed to the
# repository.
API_KEY_ENV_VAR = "DASHSCOPE_API_KEY"

# OpenAI-compatible endpoint of DashScope.
BASE_URL = "https://dashscope.aliyuncs.com/compatible-mode/v1"

# qwen-vl-ocr-latest accepts a custom prompt in the "text" part of the message;
# when none is passed the model falls back to its default prompt ("Please
# output only the text content from the image without any additional
# descriptions or formatting."). qwen-vl-ocr-1028 always uses the fixed prompt
# "Read all the text in the image." and ignores a custom one.
MODEL_NAME = "qwen-vl-ocr-latest"

# Image containing the exam questions to be recognised.
IMAGE_URL = "https://pic1.zhimg.com/v2-c3d7f060bbf3f7c122319350044d8888_1440w.jpg"

# Minimum pixel threshold: smaller images are upscaled (keeping the aspect
# ratio) until their total pixel count exceeds this value.
MIN_PIXELS = 28 * 28 * 4

# Maximum pixel threshold: larger images are downscaled (keeping the aspect
# ratio) until their total pixel count drops below this value.
MAX_PIXELS = 28 * 28 * 8192

# Markdown file that receives the recognised text.
OUTPUT_PATH = '2、识别出结果.md'


def build_prompt():
    """Return the instruction text sent to the OCR model.

    The fragments are concatenated without separators, exactly as the model
    is expected to receive them.
    """
    # NOTE(review): "忽律" in the second rule looks like a typo for "忽略"
    # ("ignore"); the text is left untouched because it is sent to the model
    # verbatim -- confirm before changing it.
    fragments = (
        "请提取图片中的试题",
        "1、需要Latex公式输出的注意加上 $$ 或 $ 进行包含。",
        "2、以中文数字开头的行请忽律掉此行比如 一、单项选择题 二、填空题 ...",
        "3、输出格式 【题型】xxx 【题目内容】 xxx 【答案】 xxxx 【解析】 xxxx。",
    )
    return "".join(fragments)


def load_api_key():
    """Return the API key stored in the ``DASHSCOPE_API_KEY`` variable.

    Raises:
        RuntimeError: if the variable is unset or empty.
    """
    api_key = os.getenv(API_KEY_ENV_VAR)
    if not api_key:
        raise RuntimeError(
            f"Environment variable {API_KEY_ENV_VAR} is not set; "
            "export your DashScope API key before running this script."
        )
    return api_key


def build_messages(image_url, prompt):
    """Build the single-turn user message: one image part plus one text part."""
    return [
        {
            "role": "user",
            "content": [
                {
                    "type": "image_url",
                    "image_url": image_url,
                    "min_pixels": MIN_PIXELS,
                    "max_pixels": MAX_PIXELS,
                },
                {
                    "type": "text",
                    "text": prompt,
                },
            ],
        }
    ]


def extract_questions(image_url=IMAGE_URL):
    """Send the image to the OCR model and return the recognised text.

    Raises:
        RuntimeError: if the API key is missing or the model returns no text.
    """
    client = OpenAI(
        api_key=load_api_key(),
        base_url=BASE_URL,
    )
    completion = client.chat.completions.create(
        model=MODEL_NAME,
        messages=build_messages(image_url, build_prompt()),
    )
    content = completion.choices[0].message.content
    if content is None:
        # Fail with a clear message instead of a TypeError inside f.write().
        raise RuntimeError("The model returned no text content.")
    return content


def main():
    """Recognise the questions, print them and save them as Markdown."""
    content = extract_questions()
    print(content)
    # Persist the returned text to the Markdown result file.
    with open(OUTPUT_PATH, 'w', encoding='utf-8') as f:
        f.write(content)
    print("保存成功!")


if __name__ == "__main__":
    main()