# langchain/libs/community/tests/integration_tests/retrievers/test_pubmed.py

"""Integration tests for the PubMed retriever (``PubMedRetriever``)."""
from typing import List

import pytest
from langchain_core.documents import Document

from langchain_community.retrievers import PubMedRetriever


@pytest.fixture
def retriever() -> PubMedRetriever:
    """Provide a ``PubMedRetriever`` constructed with no arguments."""
    pubmed_retriever = PubMedRetriever()
    return pubmed_retriever


def assert_docs(docs: List[Document]) -> None:
    """Check the metadata of every document in ``docs``.

    Each document must carry non-empty metadata whose keys are exactly
    ``Copyright Information``, ``uid``, ``Title`` and ``Published``.
    An empty ``docs`` sequence passes, since there is nothing to check.

    Raises:
        AssertionError: if any document's metadata is empty or its key
            set differs from the expected one.
    """
    expected_keys = {"Copyright Information", "uid", "Title", "Published"}
    for document in docs:
        meta = document.metadata
        assert meta
        assert set(meta) == expected_keys


def test_load_success(retriever: PubMedRetriever) -> None:
    """Query PubMed for "chatgpt" and validate the returned documents.

    Expects exactly three documents from the fixture-provided retriever
    (presumably its default ``top_k_results`` -- confirm against the
    retriever's defaults) and checks each one with ``assert_docs``.
    """
    # ``invoke`` is the Runnable entry point that supersedes the deprecated
    # ``get_relevant_documents``; it takes the query positionally.
    docs = retriever.invoke("chatgpt")
    assert len(docs) == 3
    assert_docs(docs)


def test_load_success_top_k_results(retriever: PubMedRetriever) -> None:
    """Check that setting ``top_k_results`` changes how many documents return.

    Sets ``top_k_results`` to 2 on the fixture-provided retriever, queries
    PubMed for "chatgpt", and expects exactly two documents, each checked
    with ``assert_docs``.
    """
    retriever.top_k_results = 2
    # ``invoke`` is the Runnable entry point that supersedes the deprecated
    # ``get_relevant_documents``; it takes the query positionally.
    docs = retriever.invoke("chatgpt")
    assert len(docs) == 2
    assert_docs(docs)


def test_load_no_result(retriever: PubMedRetriever) -> None:
    """Check that a query expected to match nothing yields no documents."""
    # ``invoke`` is the Runnable entry point that supersedes the deprecated
    # ``get_relevant_documents``.
    docs = retriever.invoke("1605.08386WWW")
    assert not docs
`PubMed` document loader (#8893) - added `PubMed Document Loader` artifacts; ut-s; examples - fixed `PubMed utility`; ut-s @hwchase17 2023-08-08 18:26:03 +00:00			`"""Integration test for PubMed API Wrapper."""`
			`from typing import List`

			`import pytest`
REFACTOR: Refactor langchain_core (#13627) Changes: - remove langchain_core/schema since no clear distinction b/n schema and non-schema modules - make every module that doesn't end in -y plural - where easy have 1-2 classes per file - no more than one level of nesting in directories - only import from top level core modules in langchain 2023-11-21 16:35:29 +00:00			`from langchain_core.documents import Document`
`PubMed` document loader (#8893) - added `PubMed Document Loader` artifacts; ut-s; examples - fixed `PubMed utility`; ut-s @hwchase17 2023-08-08 18:26:03 +00:00
community[major], core[patch], langchain[patch], experimental[patch]: Create langchain-community (#14463) Moved the following modules to new package langchain-community in a backwards compatible fashion: ``` mv langchain/langchain/adapters community/langchain_community mv langchain/langchain/callbacks community/langchain_community/callbacks mv langchain/langchain/chat_loaders community/langchain_community mv langchain/langchain/chat_models community/langchain_community mv langchain/langchain/document_loaders community/langchain_community mv langchain/langchain/docstore community/langchain_community mv langchain/langchain/document_transformers community/langchain_community mv langchain/langchain/embeddings community/langchain_community mv langchain/langchain/graphs community/langchain_community mv langchain/langchain/llms community/langchain_community mv langchain/langchain/memory/chat_message_histories community/langchain_community mv langchain/langchain/retrievers community/langchain_community mv langchain/langchain/storage community/langchain_community mv langchain/langchain/tools community/langchain_community mv langchain/langchain/utilities community/langchain_community mv langchain/langchain/vectorstores community/langchain_community mv langchain/langchain/agents/agent_toolkits community/langchain_community mv langchain/langchain/cache.py community/langchain_community mv langchain/langchain/adapters community/langchain_community mv langchain/langchain/callbacks community/langchain_community/callbacks mv langchain/langchain/chat_loaders community/langchain_community mv langchain/langchain/chat_models community/langchain_community mv langchain/langchain/document_loaders community/langchain_community mv langchain/langchain/docstore community/langchain_community mv langchain/langchain/document_transformers community/langchain_community mv langchain/langchain/embeddings community/langchain_community mv langchain/langchain/graphs community/langchain_community mv 
langchain/langchain/llms community/langchain_community mv langchain/langchain/memory/chat_message_histories community/langchain_community mv langchain/langchain/retrievers community/langchain_community mv langchain/langchain/storage community/langchain_community mv langchain/langchain/tools community/langchain_community mv langchain/langchain/utilities community/langchain_community mv langchain/langchain/vectorstores community/langchain_community mv langchain/langchain/agents/agent_toolkits community/langchain_community mv langchain/langchain/cache.py community/langchain_community ``` Moved the following to core ``` mv langchain/langchain/utils/json_schema.py core/langchain_core/utils mv langchain/langchain/utils/html.py core/langchain_core/utils mv langchain/langchain/utils/strings.py core/langchain_core/utils cat langchain/langchain/utils/env.py >> core/langchain_core/utils/env.py rm langchain/langchain/utils/env.py ``` See .scripts/community_split/script_integrations.sh for all changes 2023-12-11 21:53:30 +00:00			`from langchain_community.retrievers import PubMedRetriever`
`PubMed` document loader (#8893) - added `PubMed Document Loader` artifacts; ut-s; examples - fixed `PubMed utility`; ut-s @hwchase17 2023-08-08 18:26:03 +00:00

			`@pytest.fixture`
			`def retriever() -> PubMedRetriever:`
			`return PubMedRetriever()`


			`def assert_docs(docs: List[Document]) -> None:`
			`for doc in docs:`
			`assert doc.metadata`
			`assert set(doc.metadata) == {`
			`"Copyright Information",`
			`"uid",`
			`"Title",`
			`"Published",`
			`}`


			`def test_load_success(retriever: PubMedRetriever) -> None:`
			`docs = retriever.get_relevant_documents(query="chatgpt")`
			`assert len(docs) == 3`
			`assert_docs(docs)`


			`def test_load_success_top_k_results(retriever: PubMedRetriever) -> None:`
			`retriever.top_k_results = 2`
			`docs = retriever.get_relevant_documents(query="chatgpt")`
			`assert len(docs) == 2`
			`assert_docs(docs)`


			`def test_load_no_result(retriever: PubMedRetriever) -> None:`
			`docs = retriever.get_relevant_documents("1605.08386WWW")`
			`assert not docs`