From 9f28a48a92cd054741ebc55a43bda292279c3df9 Mon Sep 17 00:00:00 2001 From: Jyong <76649700+JohnJyong@users.noreply.github.com> Date: Tue, 18 Jul 2023 15:02:33 +0800 Subject: [PATCH] index add to db when dataset updated (#588) --- api/tasks/deal_dataset_vector_index_task.py | 7 +++---- 1 file changed, 3 insertions(+), 4 deletions(-) diff --git a/api/tasks/deal_dataset_vector_index_task.py b/api/tasks/deal_dataset_vector_index_task.py index fac50510e5..7eac3b3271 100644 --- a/api/tasks/deal_dataset_vector_index_task.py +++ b/api/tasks/deal_dataset_vector_index_task.py @@ -44,14 +44,13 @@ def deal_dataset_vector_index_task(dataset_id: str, action: str): if dataset_documents: # save vector index index = IndexBuilder.get_index(dataset, 'high_quality', ignore_high_quality_check=True) + documents = [] for dataset_document in dataset_documents: # delete from vector index segments = db.session.query(DocumentSegment).filter( DocumentSegment.document_id == dataset_document.id, DocumentSegment.enabled == True ) .order_by(DocumentSegment.position.asc()).all() - - documents = [] for segment in segments: document = Document( page_content=segment.content, @@ -65,8 +64,8 @@ def deal_dataset_vector_index_task(dataset_id: str, action: str): documents.append(document) - # save vector index - index.add_texts(documents) + # save vector index + index.add_texts(documents) end_at = time.perf_counter() logging.info(