diff --git a/server/knowledge_base/utils.py b/server/knowledge_base/utils.py index a1ed94e..36c972b 100644 --- a/server/knowledge_base/utils.py +++ b/server/knowledge_base/utils.py @@ -191,7 +191,7 @@ class KnowledgeFile: # TODO: 增加依据文件格式匹配text_splitter self.text_splitter_name = None - def file2text(self, using_zh_title_enhance=ZH_TITLE_ENHANCE, refresh: bool = False, build_meta_data: bool = True): + def file2text(self, using_zh_title_enhance=ZH_TITLE_ENHANCE, refresh: bool = False): if self.docs is not None and not refresh: return self.docs @@ -251,17 +251,6 @@ class KnowledgeFile: docs = loader.load_and_split(text_splitter) - if build_meta_data: - - meta_data = docs[0].metadata - # 对meta_data每项格式化成 "":"" 形式 - meta_data = {f'"{k}":"{v}"' for k, v in meta_data.items()} - # 转换成字符串 - meta_data = "\r\n" + "\r\n\b".join(meta_data) + "\r\n" - doc = Document(page_content=str(meta_data), metadata=docs[0].metadata) - # 将doc 添加到docs的第一项 - docs.insert(0, doc) - print(docs[0]) if using_zh_title_enhance: docs = zh_title_enhance(docs)