mirror of
https://github.com/hwchase17/langchain
synced 2024-11-06 03:20:49 +00:00
b24472eae3
### Summary

Adds `UnstructuredOrgModeLoader` for processing [Org-mode](https://en.wikipedia.org/wiki/Org-mode) documents.

### Testing

```python
from langchain.document_loaders import UnstructuredOrgModeLoader

loader = UnstructuredOrgModeLoader(
    file_path="example_data/README.org", mode="elements"
)
docs = loader.load()
print(docs[0])
```

### Reviewers

- @rlancemartin
- @eyurtsev
- @hwchase17
16 lines
432 B
Python
16 lines
432 B
Python
import os
|
|
from pathlib import Path
|
|
|
|
from langchain.document_loaders import UnstructuredOrgModeLoader
|
|
|
|
# Example-data directory: the "examples" folder two directory levels above
# this file. ``file_path`` is bound to the very same Path object.
file_path = Path(__file__).parent.parent / "examples"
EXAMPLE_DIRECTORY = file_path
|
|
|
|
|
|
def test_unstructured_org_mode_loader() -> None:
    """Load the example ``README.org`` and check that one document comes back."""
    # The loader is handed a plain string path, so convert the Path explicitly.
    org_readme = EXAMPLE_DIRECTORY / "README.org"
    documents = UnstructuredOrgModeLoader(str(org_readme)).load()

    assert len(documents) == 1