You've already forked DataMate
refactor(annotation): 移除文本内容获取相关功能
- 删除了 fetch_text_content_via_download_api 导入
- 移除了 TEXT 类型数据集的文本内容获取逻辑
- 删除了 _append_annotation_to_content 方法实现
- 简化了知识同步服务的内容处理流程
This commit is contained in:
@@ -11,7 +11,6 @@ from sqlalchemy.ext.asyncio import AsyncSession
|
|||||||
from app.core.config import settings
|
from app.core.config import settings
|
||||||
from app.core.logging import get_logger
|
from app.core.logging import get_logger
|
||||||
from app.db.models import Dataset, DatasetFiles, LabelingProject
|
from app.db.models import Dataset, DatasetFiles, LabelingProject
|
||||||
from app.module.annotation.service.text_fetcher import fetch_text_content_via_download_api
|
|
||||||
|
|
||||||
logger = get_logger(__name__)
|
logger = get_logger(__name__)
|
||||||
|
|
||||||
@@ -254,16 +253,6 @@ class KnowledgeSyncService:
|
|||||||
content_type = "MARKDOWN"
|
content_type = "MARKDOWN"
|
||||||
|
|
||||||
content = annotation_json
|
content = annotation_json
|
||||||
if dataset_type == "TEXT":
|
|
||||||
try:
|
|
||||||
content = await fetch_text_content_via_download_api(
|
|
||||||
project.dataset_id,
|
|
||||||
str(file_record.id),
|
|
||||||
)
|
|
||||||
content = self._append_annotation_to_content(content, annotation_json, content_type)
|
|
||||||
except Exception as exc:
|
|
||||||
logger.warning("读取文本失败,改为仅存标注JSON:%s", exc)
|
|
||||||
content = annotation_json
|
|
||||||
|
|
||||||
payload: Dict[str, Any] = {
|
payload: Dict[str, Any] = {
|
||||||
"title": title,
|
"title": title,
|
||||||
@@ -294,13 +283,6 @@ class KnowledgeSyncService:
|
|||||||
extension = file_type
|
extension = file_type
|
||||||
return extension.lower() in {"md", "markdown"}
|
return extension.lower() in {"md", "markdown"}
|
||||||
|
|
||||||
def _append_annotation_to_content(self, content: str, annotation_json: str, content_type: str) -> str:
|
|
||||||
if content_type == "MARKDOWN":
|
|
||||||
return (
|
|
||||||
f"{content}\n\n---\n\n## 标注结果\n\n```json\n"
|
|
||||||
f"{annotation_json}\n```")
|
|
||||||
return f"{content}\n\n---\n\n标注结果(JSON):\n{annotation_json}"
|
|
||||||
|
|
||||||
def _strip_extension(self, file_name: str) -> str:
|
def _strip_extension(self, file_name: str) -> str:
|
||||||
if not file_name:
|
if not file_name:
|
||||||
return ""
|
return ""
|
||||||
|
|||||||
Reference in New Issue
Block a user