From a78bc507c0e8e7ff98b2bce8c6d113ce3f0e2e9b Mon Sep 17 00:00:00 2001 From: kenwoodjw Date: Tue, 18 Nov 2025 17:36:07 +0800 Subject: [PATCH] fix: dataset metadata counts when documents are deleted (#28305) Signed-off-by: kenwoodjw --- api/tasks/batch_clean_document_task.py | 10 ++++++++-- 1 file changed, 8 insertions(+), 2 deletions(-) diff --git a/api/tasks/batch_clean_document_task.py b/api/tasks/batch_clean_document_task.py index 447443703a..3e1bd16cc7 100644 --- a/api/tasks/batch_clean_document_task.py +++ b/api/tasks/batch_clean_document_task.py @@ -9,7 +9,7 @@ from core.rag.index_processor.index_processor_factory import IndexProcessorFacto from core.tools.utils.web_reader_tool import get_image_upload_file_ids from extensions.ext_database import db from extensions.ext_storage import storage -from models.dataset import Dataset, DocumentSegment +from models.dataset import Dataset, DatasetMetadataBinding, DocumentSegment from models.model import UploadFile logger = logging.getLogger(__name__) @@ -37,6 +37,11 @@ def batch_clean_document_task(document_ids: list[str], dataset_id: str, doc_form if not dataset: raise Exception("Document has no dataset") + db.session.query(DatasetMetadataBinding).where( + DatasetMetadataBinding.dataset_id == dataset_id, + DatasetMetadataBinding.document_id.in_(document_ids), + ).delete(synchronize_session=False) + segments = db.session.scalars( select(DocumentSegment).where(DocumentSegment.document_id.in_(document_ids)) ).all() @@ -71,7 +76,8 @@ def batch_clean_document_task(document_ids: list[str], dataset_id: str, doc_form except Exception: logger.exception("Delete file failed when document deleted, file_id: %s", file.id) db.session.delete(file) - db.session.commit() + + db.session.commit() end_at = time.perf_counter() logger.info(