DocsGPT/application/parser/remote/base.py

20 lines
657 B
Python
Raw Normal View History

2023-10-11 09:13:51 +00:00
"""Base reader class."""
from abc import abstractmethod
2024-02-28 16:52:58 +00:00
from typing import Any, List
2023-10-11 09:13:51 +00:00
from langchain.docstore.document import Document as LCDocument
from application.parser.schema.base import Document
class BaseRemote:
    """Base class for remote data loaders.

    Subclasses implement :meth:`load_data`. :meth:`load_langchain_documents`
    is a convenience wrapper that calls ``load_data`` and converts each
    result with its ``to_langchain_format()`` method.
    """

    @abstractmethod
    def load_data(self, *args: Any, **load_kwargs: Any) -> List["Document"]:
        """Load data from the source and return it as a list of documents.

        Args:
            *args: Loader-specific positional inputs.
            **load_kwargs: Loader-specific keyword options.

        Returns:
            The loaded documents.

        Raises:
            NotImplementedError: Always, in this base implementation;
                subclasses must override this method.
        """
        # This class does not use ABCMeta, so @abstractmethod alone is not
        # enforced at instantiation time. Fail loudly here instead of
        # returning None, which would only surface later as an opaque
        # "'NoneType' object is not iterable" in load_langchain_documents.
        raise NotImplementedError(
            f"{type(self).__name__} must implement load_data()"
        )

    def load_langchain_documents(
        self, *args: Any, **load_kwargs: Any
    ) -> List["LCDocument"]:
        """Load data and return it in LangChain document format.

        Args:
            *args: Positional inputs forwarded unchanged to ``load_data``.
            **load_kwargs: Keyword options forwarded unchanged to
                ``load_data``.

        Returns:
            One converted document per item returned by ``load_data``,
            in the same order.
        """
        docs = self.load_data(*args, **load_kwargs)
        return [doc.to_langchain_format() for doc in docs]