2023-07-18 16:57:24 +00:00
|
|
|
import pytest
|
2023-11-21 16:35:29 +00:00
|
|
|
from langchain_core.documents import Document
|
2023-07-18 16:57:24 +00:00
|
|
|
|
2023-12-11 21:53:30 +00:00
|
|
|
from langchain_community.embeddings import FakeEmbeddings
|
|
|
|
from langchain_community.retrievers.svm import SVMRetriever
|
2023-07-18 16:57:24 +00:00
|
|
|
|
|
|
|
|
|
|
|
class TestSVMRetriever:
|
|
|
|
@pytest.mark.requires("sklearn")
|
|
|
|
def test_from_texts(self) -> None:
|
|
|
|
input_texts = ["I have a pen.", "Do you have a pen?", "I have a bag."]
|
|
|
|
svm_retriever = SVMRetriever.from_texts(
|
|
|
|
texts=input_texts, embeddings=FakeEmbeddings(size=100)
|
|
|
|
)
|
|
|
|
assert len(svm_retriever.texts) == 3
|
|
|
|
|
|
|
|
@pytest.mark.requires("sklearn")
|
|
|
|
def test_from_documents(self) -> None:
|
|
|
|
input_docs = [
|
|
|
|
Document(page_content="I have a pen.", metadata={"foo": "bar"}),
|
|
|
|
Document(page_content="Do you have a pen?"),
|
|
|
|
Document(page_content="I have a bag."),
|
|
|
|
]
|
|
|
|
svm_retriever = SVMRetriever.from_documents(
|
|
|
|
documents=input_docs, embeddings=FakeEmbeddings(size=100)
|
|
|
|
)
|
|
|
|
assert len(svm_retriever.texts) == 3
|
2023-08-11 20:08:17 +00:00
|
|
|
|
|
|
|
@pytest.mark.requires("sklearn")
|
|
|
|
def test_metadata_persists(self) -> None:
|
|
|
|
input_docs = [
|
|
|
|
Document(page_content="I have a pen.", metadata={"foo": "bar"}),
|
|
|
|
Document(page_content="How about you?", metadata={"foo": "baz"}),
|
|
|
|
Document(page_content="I have a bag.", metadata={"foo": "qux"}),
|
|
|
|
]
|
|
|
|
svm_retriever = SVMRetriever.from_documents(
|
|
|
|
documents=input_docs, embeddings=FakeEmbeddings(size=100)
|
|
|
|
)
|
|
|
|
query = "Have anything?"
|
|
|
|
output_docs = svm_retriever.get_relevant_documents(query=query)
|
|
|
|
for doc in output_docs:
|
|
|
|
assert "foo" in doc.metadata
|