diff --git a/tests/integration_tests/document_loaders/test_dir_text_loader.py b/tests/integration_tests/document_loaders/test_dir_text_loader.py deleted file mode 100644 index 3f179ce3..00000000 --- a/tests/integration_tests/document_loaders/test_dir_text_loader.py +++ /dev/null @@ -1,25 +0,0 @@ -from pathlib import Path - -import pytest - -from langchain.document_loaders import DirectoryLoader, TextLoader - - -@pytest.mark.requires("chardet") -def test_text_loader() -> None: - """Test text loader.""" - path = Path(__file__).parent.parent / "examples" - files = path.glob("**/*.txt") - loader = DirectoryLoader(str(path), glob="**/*.txt", loader_cls=TextLoader) - loader_detect_encoding = DirectoryLoader( - str(path), - glob="**/*.txt", - loader_kwargs={"autodetect_encoding": True}, - loader_cls=TextLoader, - ) - - with pytest.raises((UnicodeDecodeError, RuntimeError)): - loader.load() - - docs = loader_detect_encoding.load() - assert len(docs) == len(list(files)) diff --git a/tests/unit_tests/document_loader/test_text_loader.py b/tests/unit_tests/document_loader/test_text_loader.py new file mode 100644 index 00000000..79187ed9 --- /dev/null +++ b/tests/unit_tests/document_loader/test_text_loader.py @@ -0,0 +1,26 @@ +from pathlib import Path + +import pytest + +from langchain.document_loaders import DirectoryLoader, TextLoader + +class TestTextLoader: + + @pytest.mark.requires("chardet") + def test_load_directory(self) -> None: + """Test text loader.""" + path = Path(__file__).parent.parent / "examples" + files = path.glob("**/*.txt") + loader = DirectoryLoader(str(path), glob="**/*.txt", loader_cls=TextLoader) + loader_detect_encoding = DirectoryLoader( + str(path), + glob="**/*.txt", + loader_kwargs={"autodetect_encoding": True}, + loader_cls=TextLoader, + ) + + with pytest.raises((UnicodeDecodeError, RuntimeError)): + loader.load() + + docs = loader_detect_encoding.load() + assert len(docs) == len(list(files)) diff --git a/tests/integration_tests/examples/example-non-utf8.txt b/tests/unit_tests/examples/example-non-utf8.txt similarity index 100% rename from tests/integration_tests/examples/example-non-utf8.txt rename to tests/unit_tests/examples/example-non-utf8.txt diff --git a/tests/integration_tests/examples/example-utf8.txt b/tests/unit_tests/examples/example-utf8.txt similarity index 100% rename from tests/integration_tests/examples/example-utf8.txt rename to tests/unit_tests/examples/example-utf8.txt