Browse Source

chore: skip fetching document segments in add_document_to_index_task when the DatasetDocument's dataset does not exist (#17784)

tags/1.3.0
Bowen Liang 6 months ago
parent
commit
636a0ba37f
No account linked to committer's email address
1 changed file with 4 additions and 5 deletions
  1. 4
    5
      api/tasks/add_document_to_index_task.py

+ 4
- 5
api/tasks/add_document_to_index_task.py View File

@@ -37,6 +37,10 @@ def add_document_to_index_task(dataset_document_id: str):
indexing_cache_key = "document_{}_indexing".format(dataset_document.id)

try:
dataset = dataset_document.dataset
if not dataset:
raise Exception(f"Document {dataset_document.id} dataset {dataset_document.dataset_id} doesn't exist.")

segments = (
db.session.query(DocumentSegment)
.filter(
@@ -77,11 +81,6 @@ def add_document_to_index_task(dataset_document_id: str):
document.children = child_documents
documents.append(document)

dataset = dataset_document.dataset

if not dataset:
raise Exception("Document has no dataset")

index_type = dataset.doc_form
index_processor = IndexProcessorFactory(index_type).init_index_processor()
index_processor.load(dataset, documents)

Loading…
Cancel
Save