mirror of
https://github.com/1Panel-dev/MaxKB.git
synced 2025-12-26 01:33:05 +00:00
fix: 修复文档提取doc图片没有保存和展示的问题
This commit is contained in:
parent
4dec2a6a58
commit
2a07a50a60
|
|
@ -19,5 +19,5 @@ class BaseParseTableHandle(ABC):
|
|||
pass
|
||||
|
||||
@abstractmethod
|
||||
def get_content(self, file):
|
||||
def get_content(self, file, save_image):
|
||||
pass
|
||||
|
|
@ -35,7 +35,7 @@ class CsvSplitHandle(BaseParseTableHandle):
|
|||
|
||||
return [{'name': file.name, 'paragraphs': paragraphs}]
|
||||
|
||||
def get_content(self, file):
|
||||
def get_content(self, file, save_image):
|
||||
buffer = file.read()
|
||||
try:
|
||||
return buffer.decode(detect(buffer)['encoding'])
|
||||
|
|
|
|||
|
|
@ -61,7 +61,7 @@ class XlsSplitHandle(BaseParseTableHandle):
|
|||
return [{'name': file.name, 'paragraphs': []}]
|
||||
return result
|
||||
|
||||
def get_content(self, file):
|
||||
def get_content(self, file, save_image):
|
||||
# 打开 .xls 文件
|
||||
try:
|
||||
workbook = xlrd.open_workbook(file_contents=file.read(), formatting_info=True)
|
||||
|
|
|
|||
|
|
@ -74,7 +74,7 @@ class XlsxSplitHandle(BaseParseTableHandle):
|
|||
return result
|
||||
|
||||
|
||||
def get_content(self, file):
|
||||
def get_content(self, file, save_image):
|
||||
try:
|
||||
# 加载 Excel 文件
|
||||
workbook = load_workbook(file)
|
||||
|
|
|
|||
Loading…
Reference in New Issue