chore: skip document segments fetching with non-existed dataset of DatasetDocument in add_document_to_index_task task (#17784)

This commit is contained in:
Bowen Liang 2025-04-10 17:12:48 +08:00 committed by GitHub
parent 29720b7360
commit 636a0ba37f
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@ -37,6 +37,10 @@ def add_document_to_index_task(dataset_document_id: str):
indexing_cache_key = "document_{}_indexing".format(dataset_document.id) indexing_cache_key = "document_{}_indexing".format(dataset_document.id)
try: try:
dataset = dataset_document.dataset
if not dataset:
raise Exception(f"Document {dataset_document.id} dataset {dataset_document.dataset_id} doesn't exist.")
segments = ( segments = (
db.session.query(DocumentSegment) db.session.query(DocumentSegment)
.filter( .filter(
@ -77,11 +81,6 @@ def add_document_to_index_task(dataset_document_id: str):
document.children = child_documents document.children = child_documents
documents.append(document) documents.append(document)
dataset = dataset_document.dataset
if not dataset:
raise Exception("Document has no dataset")
index_type = dataset.doc_form index_type = dataset.doc_form
index_processor = IndexProcessorFactory(index_type).init_index_processor() index_processor = IndexProcessorFactory(index_type).init_index_processor()
index_processor.load(dataset, documents) index_processor.load(dataset, documents)