# -*- coding: utf-8 -*-
#
# @author:
# @date:
# @version:
# @description:
from knowledgebase.db.doc_db_helper import doc_dbh
from knowledgebase.doc.doc_processor import DocProcessor


def test_process():
    """Run ``DocProcessor.process()`` on every enabled document path.

    Only the uncommented entries of the list below are processed; the
    commented-out paths are alternative inputs kept for manual toggling.
    """
    doc_paths = [
        # r"D:\KnowledgeBase\doc\XA-5D无人机1553B总线传输通信帧分配(公开).docx",
        # r"D:\KnowledgeBase\doc\XA-5D无人机分系统遥测源包设计报告(公开).docx",
        # r"D:\KnowledgeBase\doc\XA-5D无人机软件用户需求(公开).docx",
        # r"D:\KnowledgeBase\doc\XA-5D无人机遥测大纲(公开).docx",
        # r"D:\KnowledgeBase\doc\XA-5D无人机遥测信号分配表(公开).docx",
        # r"D:\KnowledgeBase\doc\指令格式(公开).docx",
        # r"D:\KnowledgeBase\doc\HY-4A数管分系统遥测源包设计报告 Z 240824 更改3(内部) .docx",
        # r"D:\KnowledgeBase\doc\HY-4A数管分系统应用软件用户需求(星务管理分册) Z 240831 更改4(内部).docx",
        # r"D:\KnowledgeBase\doc\HY-4A卫星1553B总线传输通信帧分配 Z 240824 更改3(内部).docx",
        # r"D:\KnowledgeBase\doc\HY-4A卫星遥测大纲 Z 240824 更改3(内部).docx",
        # r"D:\KnowledgeBase\doc\通用-数管分系统指令格式与编码定义及使用准则,编写中V4,20240119(内部).docx"
        r"D:\projects\KnowledgeBase\doc_xx25\卫星遥测大纲Z250226(秘密★10年) - 副本.docx"
        # r"D:\KnowledgeBase\doc\指令格式.docx"
    ]
    for doc_path in doc_paths:
        # A fresh processor is built for each document.
        DocProcessor(doc_path).process()


def test_get_text_by_entity():
    """Print what ``doc_dbh.get_text_with_entities`` returns for one entity."""
    entity_names = ['遥测源包下传时机']
    print(doc_dbh.get_text_with_entities(entity_names))


if __name__ == '__main__':
    # Manual entry point: switch the call below to run the other check.
    test_process()
    # test_get_text_by_entity()