mirror of
https://github.com/hwchase17/langchain
synced 2024-11-08 07:10:35 +00:00
00c6ec8a2d
# Fix Telegram API loader + add tests. I was testing this integration and it was broken with the following error: ```python message_threads = loader._get_message_threads(df) KeyError: False ``` Also, this particular loader didn't have any tests or a related group in poetry, so I added those as well. @hwchase17 / @eyurtsev please take a look at this fix PR. --------- Co-authored-by: Dev 2049 <dev.dev2049@gmail.com>
29 lines
921 B
Python
29 lines
921 B
Python
"""Test Base Schema of documents."""
|
|
from typing import Iterator
|
|
|
|
from langchain.document_loaders.base import BaseBlobParser
|
|
from langchain.document_loaders.blob_loaders import Blob
|
|
from langchain.schema import Document
|
|
|
|
|
|
def test_base_blob_parser() -> None:
    """Check that the default eager ``parse`` is wired to ``lazy_parse``."""

    class SingleDocParser(BaseBlobParser):
        """Parser stub whose lazy interface emits exactly one document."""

        def lazy_parse(self, blob: Blob) -> Iterator[Document]:
            """Yield one fixed document; the blob argument is not inspected."""
            yield Document(page_content="foo")

    blob_parser = SingleDocParser()

    # The lazy interface must hand back an iterator.
    lazy_result = blob_parser.lazy_parse(Blob(data="who?"))
    assert isinstance(lazy_result, Iterator)

    # Only lazy_parse is overridden above, so getting the stub's document out
    # of parse() shows the eager method is hooked up to the lazy one by default.
    eager_docs = blob_parser.parse(Blob(data="who?"))
    assert len(eager_docs) == 1
    assert eager_docs[0].page_content == "foo"
|