From 53269506bfa28f55fb378d8c3c1efba5bf927f49 Mon Sep 17 00:00:00 2001 From: jyong Date: Tue, 19 Mar 2024 20:29:02 +0800 Subject: [PATCH] fix: skip document nodes whose page content is empty --- .../index_processor/processor/paragraph_index_processor.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/api/core/rag/index_processor/processor/paragraph_index_processor.py b/api/core/rag/index_processor/processor/paragraph_index_processor.py index 3f0467ee24..0f282c4261 100644 --- a/api/core/rag/index_processor/processor/paragraph_index_processor.py +++ b/api/core/rag/index_processor/processor/paragraph_index_processor.py @@ -48,8 +48,9 @@ class ParagraphIndexProcessor(BaseIndexProcessor): page_content = page_content[1:] else: page_content = page_content - document_node.page_content = page_content - split_documents.append(document_node) + if page_content: + document_node.page_content = page_content + split_documents.append(document_node) all_documents.extend(split_documents) return all_documents