refactor: update dataset_id to knowledge_id in zip_split_handle.py and tools.py

This commit is contained in:
CaptainB 2025-06-18 21:28:33 +08:00
parent c0b770f41e
commit 45908b91ff

View File

@ -27,7 +27,6 @@ from common.handle.impl.text.text_split_handle import TextSplitHandle
from common.handle.impl.text.xls_split_handle import XlsSplitHandle
from common.handle.impl.text.xlsx_split_handle import XlsxSplitHandle
from common.utils.common import parse_md_image
from knowledge.models import File
class FileBufferHandle:
@ -39,22 +38,6 @@ class FileBufferHandle:
return self.buffer
def save_image(image_list):
if image_list is not None and len(image_list) > 0:
exist_image_list = [str(i.get('id')) for i in
QuerySet(File).filter(id__in=[i.id for i in image_list]).values('id')]
save_image_list = [image for image in image_list if not exist_image_list.__contains__(str(image.id))]
save_image_list = list({img.id: img for img in save_image_list}.values())
print('Saving images:', len(save_image_list))
# for file in save_image_list:
# file_bytes = file.meta.pop('content')
# file.meta['knowledge_id'] = self.data.get('knowledge_id')
# file.source_type = FileSourceType.KNOWLEDGE
# file.source_id = self.data.get('knowledge_id')
# file.save(file_bytes)
# if len(save_image_list) > 0:
# QuerySet(File).bulk_create(save_image_list)
default_split_handle = TextSplitHandle()
split_handles = [