|
|
|
@@ -3,6 +3,7 @@ |
|
|
|
import uuid |
|
|
|
from typing import Optional |
|
|
|
|
|
|
|
from configs import dify_config |
|
|
|
from core.model_manager import ModelInstance |
|
|
|
from core.rag.cleaner.clean_processor import CleanProcessor |
|
|
|
from core.rag.datasource.retrieval_service import RetrievalService |
|
|
|
@@ -80,6 +81,10 @@ class ParentChildIndexProcessor(BaseIndexProcessor): |
|
|
|
child_nodes = self._split_child_nodes( |
|
|
|
document, rules, process_rule.get("mode"), kwargs.get("embedding_model_instance") |
|
|
|
) |
|
|
|
if kwargs.get("preview"): |
|
|
|
if len(child_nodes) > dify_config.CHILD_CHUNKS_PREVIEW_NUMBER: |
|
|
|
child_nodes = child_nodes[: dify_config.CHILD_CHUNKS_PREVIEW_NUMBER] |
|
|
|
|
|
|
|
document.children = child_nodes |
|
|
|
doc_id = str(uuid.uuid4()) |
|
|
|
hash = helper.generate_text_hash(document.page_content) |