morphik-core/core/parser/base_parser.py
2024-11-24 14:29:25 -05:00

17 lines
485 B
Python

from abc import ABC, abstractmethod
from typing import List, Union
from fastapi import UploadFile
class BaseParser(ABC):
    """Abstract interface for document parsers.

    Both methods are declared with ``@abstractmethod``, so this class cannot
    be instantiated directly; a concrete parser must override ``split_text``
    and ``parse_file`` (both coroutines).
    """

    @abstractmethod
    async def split_text(self, text: str) -> List[str]:
        """Split plain text into chunks.

        Args:
            text: The plain text to split.

        Returns:
            The chunks of ``text`` as a list of strings. How the text is
            divided is left to the implementing subclass.
        """

    @abstractmethod
    async def parse_file(self, file: Union[UploadFile, bytes], content_type: str) -> List[str]:
        """Parse file content into text chunks.

        Args:
            file: The file to parse, given either as an ``UploadFile`` or as
                raw ``bytes``.
            content_type: Content type of ``file`` (presumably a MIME type
                string -- confirm against callers).

        Returns:
            The text chunks extracted from the file as a list of strings.
        """