# QingLong/AI/Neo4j/KnowledgeGraph.py

# -*- coding: utf-8 -*-
import re
import time
from typing import Iterator, Tuple
from openai import OpenAI
from openai.types.chat import ChatCompletionChunk
from Config import *


class KnowledgeGraph:
    """Ask a chat model to analyse an exam question and emit Neo4j inserts.

    The question text is sent to an OpenAI-compatible endpoint together with
    a fixed system prompt; the streamed answer is echoed to stdout and any
    Cypher found in Markdown code fences is extracted from it.

    NOTE(review): ``HW_API_KEY``, ``HW_API_URL`` and ``MODEL_NAME`` are not
    defined in this file; presumably they come from ``from Config import *``.
    """

    def __init__(self, shiti_content: str):
        """Store the question text and build the API client.

        Args:
            shiti_content: Question text sent as the user message.
        """
        self.shiti_content = shiti_content
        self.client = OpenAI(api_key=HW_API_KEY, base_url=HW_API_URL)

    def _generate_stream(self) -> "Iterator[ChatCompletionChunk]":
        """Start a streaming chat completion for the stored question.

        Returns:
            Whatever ``client.chat.completions.create(stream=True)`` returns;
            ``run`` iterates over it chunk by chunk.
        """
        system_prompt = '''回答以下内容:
1. 这道题目有哪些知识点，哪些能力点
2. 生成Neo4j 5.26.2的插入语句'''
        return self.client.chat.completions.create(
            model=MODEL_NAME,
            messages=[
                {"role": "system", "content": system_prompt},
                {"role": "user", "content": self.shiti_content}
            ],
            stream=True,
            timeout=300
        )

    @staticmethod
    def _strip_line_comment(line: str) -> str:
        """Return ``line`` without a trailing ``//`` comment.

        A ``//`` that sits inside a single-quoted, double-quoted or
        backtick-quoted token (for example ``'http://host/x'``) is kept.
        """
        quote = None
        pos = 0
        while pos < len(line):
            char = line[pos]
            if quote is not None:
                if char == '\\' and quote != '`':
                    # Skip the escaped character so \' or \" does not end the string.
                    pos += 2
                    continue
                if char == quote:
                    quote = None
            elif char in ('"', "'", '`'):
                quote = char
            elif line.startswith('//', pos):
                return line[:pos]
            pos += 1
        return line

    @staticmethod
    def _iter_fenced_blocks(content: str):
        """Yield ``(language, lines)`` for each closed Markdown code fence.

        Every fence is tracked, including non-Cypher ones, so that the closing
        fence of one block is never mistaken for the opening fence of the next.
        A block that is never closed is discarded.
        """
        fence = "```"
        inside = False
        language = ""
        body = []
        for raw_line in content.split('\n'):
            if inside:
                close_at = raw_line.find(fence)
                if close_at < 0:
                    body.append(raw_line)
                    continue
                # Keep text that precedes a closing fence on the same line.
                body.append(raw_line[:close_at])
                yield language, body
                inside = False
                continue

            stripped = raw_line.strip()
            if not stripped.startswith(fence):
                continue
            tag = stripped[len(fence):]
            if fence in tag:
                # Opened and closed on one line: an inline span, not a block.
                continue
            inside, language, body = True, tag.strip().lower(), []

    def _extract_cypher(self, content: str) -> str:
        """Extract Cypher statements from the Markdown code fences in ``content``.

        Fences tagged ``cypher`` (any letter case) and untagged fences are
        used; fences tagged with another language are skipped. Inside a block,
        ``//`` comments and blank lines are removed and each line is trimmed.

        Args:
            content: Full Markdown text returned by the model.

        Returns:
            The cleaned blocks separated by a blank line, each block except
            the last terminated by exactly one ``;``. Empty string when no
            usable block exists.
        """
        processed = []
        for language, lines in self._iter_fenced_blocks(content):
            if language not in ("", "cypher"):
                continue
            cleaned_lines = [
                cleaned
                for cleaned in (self._strip_line_comment(raw).strip() for raw in lines)
                if cleaned
            ]
            if cleaned_lines:
                processed.append('\n'.join(cleaned_lines))

        # Terminate every block but the last, without doubling an existing ';'.
        terminated = [
            block if block.endswith(';') else block + ';'
            for block in processed[:-1]
        ]
        return '\n\n'.join(terminated + processed[-1:])

    def run(self) -> Tuple[bool, str, str]:
        """Stream the model answer, echo it, and extract the Cypher script.

        Returns:
            ``(True, full_content, cypher_script)`` when any content arrived
            (``cypher_script`` may be empty), ``(False, "", "")`` when the
            stream produced no content, and ``(False, error_message, "")``
            when an exception was raised.
        """
        start_time = time.time()
        spinner = ['⠋', '⠙', '⠹', '⠸', '⠼', '⠴', '⠦', '⠧', '⠇', '⠏']
        content_buffer = []

        try:
            print("🚀 开始生成知识点和能力点的总结和插入语句")
            stream = self._generate_stream()

            for idx, chunk in enumerate(stream):
                if not content_buffer:
                    # Animate only while waiting for the first content: the
                    # carriage return would otherwise overwrite streamed text.
                    print(
                        f"\r{spinner[idx % len(spinner)]} 生成中（{int(time.time() - start_time)}秒）",
                        end="",
                        flush=True,
                    )

                if chunk.choices and chunk.choices[0].delta.content:
                    content_chunk = chunk.choices[0].delta.content
                    content_buffer.append(content_chunk)

                    if len(content_buffer) == 1:
                        print("\n\n📝 内容生成开始：")
                    print(content_chunk, end="", flush=True)

            if content_buffer:
                full_content = ''.join(content_buffer)
                cypher_script = self._extract_cypher(full_content)

                print(f"\n\n✅ 生成成功！耗时 {int(time.time() - start_time)}秒")
                print("\n================ 完整结果 ================")
                print(full_content)
                print("\n================ Cypher语句 ===============")
                print(cypher_script if cypher_script else "未检测到Cypher语句")
                print("==========================================")
                return True, full_content, cypher_script
            return False, "", ""

        except Exception as e:
            # Top-level boundary: report the failure to the caller instead of raising.
            print(f"\n\n❌ 生成失败：{str(e)}")
            return False, str(e), ""


if __name__ == '__main__':
    # Sample question (a third-grade perimeter problem) used as a manual smoke test.
    # Written as explicit pieces so the leading/trailing whitespace is visible.
    question_text = (
        "\n"
        "    下面是一道小学三年级的数学题目，巧求周长：\n"
        "    把7个完全相同的小长方形拼成如图的样子，已知每个小长方形的长是10厘米，则拼成的大长方形的周长是多少厘米？    \n"
        "    "
    )
    ok, _full_text, cypher_script = KnowledgeGraph(question_text).run()

    # Persist the script only when generation succeeded and Cypher was found.
    if ok and cypher_script:
        with open("knowledge_graph.cypher", "w", encoding="utf-8") as out_file:
            out_file.write(cypher_script)
        print("\nCypher语句已保存至 knowledge_graph.cypher")
-												'commit'

											
										
										
											5 months ago
+								# -*- coding: utf-8 -*-
-												'commit'

											
										
										
											5 months ago
+								import re
-												'commit'

											
										
										
											5 months ago
+								import time
-												'commit'

											
										
										
											5 months ago
+								from typing import Iterator, Tuple
-												'commit'

											
										
										
											5 months ago
+								from openai import OpenAI
 								from openai.types.chat import ChatCompletionChunk
-												'commit'

											
										
										
											5 months ago
+								from Config import *
-												'commit'

											
										
										
											5 months ago
 								class KnowledgeGraph:
-												'commit'

											
										
										
											5 months ago
+								    def __init__(self, shiti_content: str):
 								        self.shiti_content = shiti_content
 								        self.client = OpenAI(api_key=HW_API_KEY, base_url=HW_API_URL)
-												'commit'

											
										
										
											5 months ago
-												'commit'

											
										
										
											5 months ago
+								    def _generate_stream(self) -> Iterator[ChatCompletionChunk]:
-												'commit'

											
										
										
											5 months ago
+								        """流式生成内容"""
-												'commit'

											
										
										
											5 months ago
+								        system_prompt = '''回答以下内容:
 . 这道题目有哪些知识点，哪些能力点
 . 生成Neo4j 5.26.2的插入语句'''
 								        return self.client.chat.completions.create(
-												'commit'

											
										
										
											5 months ago
+								            model=MODEL_NAME,
-												'commit'

											
										
										
											5 months ago
+								            messages=[
 								                {"role": "system", "content": system_prompt},
-												'commit'

											
										
										
											5 months ago
+								                {"role": "user", "content": self.shiti_content}
-												'commit'

											
										
										
											5 months ago
+								            ],
 								            stream=True,
-												'commit'

											
										
										
											5 months ago
+								            timeout=300
-												'commit'

											
										
										
											5 months ago
+								        )
-												'commit'

											
										
										
											5 months ago
+								    def _extract_cypher(self, content: str) -> str:
 								        """从内容中提取Cypher语句（修正版）"""
 								        # 匹配包含cypher的代码块（支持可选语言声明）
 								        pattern = r"```(?:cypher)?\n(.*?)```"
 								        matches = re.findall(pattern, content, re.DOTALL)
 								        processed = []
 								        for block in matches:
 								            # 清理每行：移除注释和首尾空格
 								            cleaned_lines = []
 								            for line in block.split('\n'):
 								                line = line.split('//')[0].strip()  # 移除行尾注释
 								                if line:  # 保留非空行
 								                    cleaned_lines.append(line)
 								            if cleaned_lines:
 								                processed.append('\n'.join(cleaned_lines))
 								        return ';\n\n'.join(processed) if processed else ""
 								    def run(self) -> Tuple[bool, str, str]:
 								        """执行生成流程（返回状态、完整内容、Cypher语句）"""
-												'commit'

											
										
										
											5 months ago
+								        start_time = time.time()
 								        spinner = ['⠋', '⠙', '⠹', '⠸', '⠼', '⠴', '⠦', '⠧', '⠇', '⠏']
 								        content_buffer = []
-												'commit'

											
										
										
											5 months ago
+								        cypher_script = ""
-												'commit'

											
										
										
											5 months ago
 								        try:
 								            print(f"🚀 开始生成知识点和能力点的总结和插入语句")
-												'commit'

											
										
										
											5 months ago
+								            stream = self._generate_stream()
-												'commit'

											
										
										
											5 months ago
-												'commit'

											
										
										
											5 months ago
+								            for idx, chunk in enumerate(stream):
-												'commit'

											
										
										
											5 months ago
+								                print(f"\r{spinner[idx % 10]} 生成中（{int(time.time() - start_time)}秒）", end="")
-												'commit'

											
										
										
											5 months ago
+								                if chunk.choices and chunk.choices[0].delta.content:
 								                    content_chunk = chunk.choices[0].delta.content
 								                    content_buffer.append(content_chunk)
 								                    if len(content_buffer) == 1:
 								                        print("\n\n📝 内容生成开始：")
 								                    print(content_chunk, end="", flush=True)
-												'commit'

											
										
										
											5 months ago
 								            if content_buffer:
-												'commit'

											
										
										
											5 months ago
+								                full_content = ''.join(content_buffer)
-												'commit'

											
										
										
											5 months ago
+								                cypher_script = self._extract_cypher(full_content)
-												'commit'

											
										
										
											5 months ago
+								                print(f"\n\n✅ 生成成功！耗时 {int(time.time() - start_time)}秒")
-												'commit'

											
										
										
											5 months ago
+								                print("\n================ 完整结果 ================")
 								                print(full_content)
-												'commit'

											
										
										
											5 months ago
+								                print("\n================ Cypher语句 ===============")
 								                print(cypher_script if cypher_script else "未检测到Cypher语句")
 								                print("==========================================")
 								                return True, full_content, cypher_script
 								            return False, "", ""
-												'commit'

											
										
										
											5 months ago
 								        except Exception as e:
 								            print(f"\n\n❌ 生成失败：{str(e)}")
-												'commit'

											
										
										
											5 months ago
+								            return False, str(e), ""
-												'commit'

											
										
										
											5 months ago
 								if __name__ == '__main__':
-												'commit'

											
										
										
											5 months ago
+								    shiti_content = '''
-												'commit'

											
										
										
											5 months ago
+								    下面是一道小学三年级的数学题目，巧求周长：
 								    把7个完全相同的小长方形拼成如图的样子，已知每个小长方形的长是10厘米，则拼成的大长方形的周长是多少厘米？
 								    '''
-												'commit'

											
										
										
											5 months ago
+								    kg = KnowledgeGraph(shiti_content)
-												'commit'

											
										
										
											5 months ago
+								    success, result, cypher = kg.run()
-												'commit'

											
										
										
											5 months ago
-												'commit'

											
										
										
											5 months ago
+								    if success and cypher:
 								        with open("knowledge_graph.cypher", "w", encoding="utf-8") as f:
 								            f.write(cypher)
 								        print("\nCypher语句已保存至 knowledge_graph.cypher")