mirror of
https://github.com/1Panel-dev/MaxKB.git
synced 2025-12-26 01:33:05 +00:00
fix: 向量化的时候限制最大值
This commit is contained in:
parent
47cb83ce0c
commit
740f1d3dd1
|
|
@ -8,7 +8,20 @@
|
|||
"""
|
||||
import importlib
|
||||
from functools import reduce
|
||||
from typing import Dict
|
||||
from typing import Dict, List
|
||||
|
||||
|
||||
def sub_array(array: List, item_num=50):
    """Split ``array`` into consecutive chunks of at most ``item_num`` items.

    The order of the items is preserved. For a positive ``item_num`` every
    chunk except possibly the last one holds exactly ``item_num`` items.
    An empty input yields an empty list.

    :param array: items to split; it is only iterated, never indexed
    :param item_num: maximum number of items per chunk. A value below 1
        makes every item end up in its own chunk, because a chunk is
        flushed as soon as its length reaches ``item_num``.
    :return: a list of chunks, each chunk being a newly created list
    """
    result = []
    temp = []
    for item in array:
        temp.append(item)
        # Flush the current chunk as soon as it is full.
        if len(temp) >= item_num:
            result.append(temp)
            temp = []
    # Keep the trailing, partially filled chunk (if any).
    if temp:
        result.append(temp)
    return result
|
||||
|
||||
|
||||
def query_params_to_single_dict(query_params: Dict):
|
||||
|
|
|
|||
|
|
@ -12,6 +12,7 @@ from typing import List, Dict
|
|||
from langchain.embeddings import HuggingFaceEmbeddings
|
||||
|
||||
from common.config.embedding_config import EmbeddingModel
|
||||
from common.util.common import sub_array
|
||||
from embedding.models import SourceType
|
||||
|
||||
|
||||
|
|
@ -80,7 +81,9 @@ class BaseVectorStore(ABC):
|
|||
if embedding is None:
|
||||
embedding = EmbeddingModel.get_embedding_model()
|
||||
self.save_pre_handler()
|
||||
self._batch_save(data_list, embedding)
|
||||
result = sub_array(data_list)
|
||||
for child_array in result:
|
||||
self._batch_save(child_array, embedding)
|
||||
return True
|
||||
|
||||
@abstractmethod
|
||||
|
|
|
|||
Loading…
Reference in New Issue