From acde3bd32f07bf02839a21e8fe5b4e69bfca2251 Mon Sep 17 00:00:00 2001 From: lyg <1543117173@qq.com> Date: 星期三, 14 五月 2025 10:37:00 +0800 Subject: [PATCH] docx文档拆分,文档段落实体词提取,存入mysql数据库。 --- knowledgebase/db/neo4j.py | 19 ++++++++++++++++++- 1 files changed, 18 insertions(+), 1 deletions(-) diff --git a/knowledgebase/db/neo4j.py b/knowledgebase/db/neo4j.py index 5b9f887..b0916f4 100644 --- a/knowledgebase/db/neo4j.py +++ b/knowledgebase/db/neo4j.py @@ -24,7 +24,15 @@ entities=json.dumps(page_info.entities, ensure_ascii=False, indent=2)) self.graph.create(node) return node - + def create_trunk_node(self, trunk, entities): + """ + 创建页面节点 + """ + # 创建节点 + node = Node("Trunk", trunk=trunk, + entities=json.dumps(entities, ensure_ascii=False, indent=2)) + self.graph.create(node) + return node def create_entity_node(self, entity: str): """ 创建实体节点 @@ -36,6 +44,15 @@ self.graph.create(node) return node + + def create_trunk_entity_relationship(self, page_node, entity_node): + """ + 创建页面和实体节点的关系 + """ + relationship = Relationship(page_node, "trunk_entity", entity_node) + self.graph.create(relationship) + return relationship + def create_page_entity_relationship(self, page_node, entity_node): """ 创建页面和实体节点的关系 -- Gitblit v1.9.1