diff --git a/apps/common/handle/impl/pdf_split_handle.py b/apps/common/handle/impl/pdf_split_handle.py index ca6d3bbde..99e238783 100644 --- a/apps/common/handle/impl/pdf_split_handle.py +++ b/apps/common/handle/impl/pdf_split_handle.py @@ -236,14 +236,28 @@ class PdfSplitHandle(BaseSplitHandle): # 目录中没有前言部分,手动处理 if handle_pre_toc: - if pattern_list is not None and len(pattern_list) > 0: - split_model = SplitModel(pattern_list, with_filter, limit) - else: - split_model = SplitModel(default_pattern_list, with_filter=with_filter, limit=limit) - # 插入目录前的部分 - page_content = re.sub(r'(? 0: + split_model = SplitModel(pattern_list, with_filter, limit) + else: + split_model = SplitModel(default_pattern_list, with_filter=with_filter, limit=limit) + # 插入目录前的部分 + page_content = re.sub(r'(?