From 499fc90f2f47f0a9265175cf3bd87321d6e603f8 Mon Sep 17 00:00:00 2001 From: shaohuzhang1 <80892890+shaohuzhang1@users.noreply.github.com> Date: Tue, 16 Jul 2024 10:59:13 +0800 Subject: [PATCH] =?UTF-8?q?fix:=20=E4=BF=AE=E5=A4=8D=E5=9C=A8=E7=BA=BF?= =?UTF-8?q?=E7=9F=A5=E8=AF=86=E5=BA=93=E7=88=AC=E5=8F=96=E6=96=87=E6=A1=A3?= =?UTF-8?q?=E5=90=8D=E8=B6=85=E8=BF=87128=E4=B8=AA=E5=AD=97=E7=AC=A6?= =?UTF-8?q?=E6=8A=A5=E9=94=99=20#706=20(#778)?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit (cherry picked from commit 32498114282a0d4afbf3bbc8eb305a1c17f01700) --- apps/dataset/serializers/document_serializers.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/apps/dataset/serializers/document_serializers.py b/apps/dataset/serializers/document_serializers.py index 9496ac7e1..07a39b578 100644 --- a/apps/dataset/serializers/document_serializers.py +++ b/apps/dataset/serializers/document_serializers.py @@ -656,13 +656,13 @@ class DocumentSerializers(ApiMixin, serializers.Serializer): paragraphs = get_split_model('web.md').parse(response.content) # 插入 DocumentSerializers.Create(data={'dataset_id': dataset_id}).save( - {'name': source_url, 'paragraphs': paragraphs, + {'name': source_url[0:128], 'paragraphs': paragraphs, 'meta': {'source_url': source_url, 'selector': selector}, 'type': Type.web}, with_valid=True) except Exception as e: logging.getLogger("max_kb_error").error(f'{str(e)}:{traceback.format_exc()}') else: - Document(name=source_url, + Document(name=source_url[0:128], meta={'source_url': source_url, 'selector': selector}, type=Type.web, char_length=0,