feat: Add original file ID to document metadata in RagEtlService

This commit is contained in:
Dallas98
2025-12-01 17:04:52 +08:00
parent bb3345268e
commit 9fc35f066f

View File

@@ -106,6 +106,7 @@ public class RagEtlService {
document = new HtmlToTextDocumentTransformer().transform(document);
}
document.metadata().put("rag_file_id", ragFile.getId());
document.metadata().put("original_file_id", ragFile.getFileId());
// Split the document into segments using the document splitter
DocumentSplitter splitter = documentSplitter(event.addFilesReq());
List<TextSegment> split = splitter.split(document);