From 9fc35f066f2aec338535d849a61aecf761ca6680 Mon Sep 17 00:00:00 2001 From: Dallas98 <990259227@qq.com> Date: Mon, 1 Dec 2025 17:04:52 +0800 Subject: [PATCH] feat: Add original file ID to document metadata in RagEtlService --- .../datamate/rag/indexer/infrastructure/event/RagEtlService.java | 1 + 1 file changed, 1 insertion(+) diff --git a/backend/services/rag-indexer-service/src/main/java/com/datamate/rag/indexer/infrastructure/event/RagEtlService.java b/backend/services/rag-indexer-service/src/main/java/com/datamate/rag/indexer/infrastructure/event/RagEtlService.java index f1c9f1d..53c78fa 100644 --- a/backend/services/rag-indexer-service/src/main/java/com/datamate/rag/indexer/infrastructure/event/RagEtlService.java +++ b/backend/services/rag-indexer-service/src/main/java/com/datamate/rag/indexer/infrastructure/event/RagEtlService.java @@ -106,6 +106,7 @@ public class RagEtlService { document = new HtmlToTextDocumentTransformer().transform(document); } document.metadata().put("rag_file_id", ragFile.getId()); + document.metadata().put("original_file_id", ragFile.getFileId()); // 使用文档分块器对文档进行分块 DocumentSplitter splitter = documentSplitter(event.addFilesReq()); List split = splitter.split(document);