Files
DataMate/runtime/ops/mapper/knowledge_relation_slice/knowledge_slice.py
2025-10-21 23:00:48 +08:00

24 lines
704 B
Python

#!/usr/bin/python3
# -*- coding: utf-8 -*-
from typing import List
from loguru import logger
from datamate.common.utils.text_splitter import TextSplitter
class TextSegmentationOperator:
    """Split raw text into chunks by delegating to a ``TextSplitter``.

    The splitter is created once in ``__init__`` and reused by every
    ``process`` call.
    """

    def __init__(self, chunk_size, chunk_overlap):
        """Create the underlying text splitter.

        Args:
            chunk_size: Forwarded to ``TextSplitter`` as its second
                positional argument.
            chunk_overlap: Forwarded to ``TextSplitter`` as its third
                positional argument.

        Raises:
            Exception: Any error raised while constructing ``TextSplitter``;
                it is logged and then re-raised unchanged.
        """
        try:
            # NOTE(review): the meaning of the leading -1 is defined by
            # TextSplitter, which is not visible here -- confirm before
            # changing it.
            self.text_splitter = TextSplitter(-1, chunk_size, chunk_overlap)
        except Exception as err:
            logger.exception(f"init text splitter failed, error is: {err}")
            # Bare ``raise`` re-raises the active exception as-is, keeping
            # its original traceback.
            raise

    def process(self, input_data: str) -> List[str]:
        """Return the chunks produced for ``input_data``.

        Args:
            input_data: Text to split. ``None`` is tolerated and handled
                like empty text instead of failing on ``.strip()``.

        Returns:
            An empty list when the input is ``None``, empty, or contains
            only whitespace; otherwise whatever
            ``self.text_splitter.split_text`` returns for the unmodified
            input.
        """
        # Only the emptiness check strips whitespace; the splitter still
        # receives the original, unstripped text.
        if input_data is None or not input_data.strip():
            logger.info("input text is empty, return empty chunks.")
            return []
        return self.text_splitter.split_text(input_data)