fix: PDF上传知识库开始导入接口报错 #122 (#125)

This commit is contained in:
shaohuzhang1 2024-04-16 20:59:27 +08:00 committed by GitHub
parent 5b7ae292ec
commit 5e499e6afa
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -336,6 +336,7 @@ class SplitModel:
:return: 解析后数据 {content:段落数据,keywords:[段落关键词],parent_chain:['段落父级链路']}
"""
text = text.replace('\r', '\n')
text = text.replace("\0", '')
result_tree = self.parse_to_tree(text, 0)
result = result_tree_to_paragraph(result_tree, [], [])
return [item for item in [self.post_reset_paragraph(row) for row in result] if