2022-11-07 13:46:44 +00:00
|
|
|
"""Test huggingface embeddings."""
|
2022-11-09 21:26:58 +00:00
|
|
|
|
2023-02-02 16:44:02 +00:00
|
|
|
from langchain.embeddings.huggingface import (
|
|
|
|
HuggingFaceEmbeddings,
|
|
|
|
HuggingFaceInstructEmbeddings,
|
|
|
|
)
|
2022-11-07 13:46:44 +00:00
|
|
|
|
|
|
|
|
|
|
|
def test_huggingface_embedding_documents() -> None:
    """Embed a one-item document list with HuggingFaceEmbeddings.

    The embedder is built with no arguments; the test expects exactly one
    vector back, and expects that vector to have 768 entries.
    """
    texts = ["foo bar"]
    vectors = HuggingFaceEmbeddings().embed_documents(texts)
    # One input document should produce one embedding vector.
    assert len(vectors) == 1
    assert len(vectors[0]) == 768
|
|
|
|
|
|
|
|
|
|
|
|
def test_huggingface_embedding_query() -> None:
    """Embed a single query string with HuggingFaceEmbeddings.

    The embedder is constructed with ``encode_kwargs`` carrying a
    ``batch_size`` of 16; the test expects the returned vector to have
    768 entries.
    """
    encode_options = {"batch_size": 16}
    embedder = HuggingFaceEmbeddings(encode_kwargs=encode_options)
    vector = embedder.embed_query("foo bar")
    assert len(vector) == 768
|
2023-02-02 16:44:02 +00:00
|
|
|
|
|
|
|
|
|
|
|
def test_huggingface_instructor_embedding_documents() -> None:
    """Embed a one-item document list with HuggingFaceInstructEmbeddings.

    The embedder is built with no arguments; the test expects exactly one
    vector back, and expects that vector to have 768 entries.
    """
    texts = ["foo bar"]
    vectors = HuggingFaceInstructEmbeddings().embed_documents(texts)
    # One input document should produce one embedding vector.
    assert len(vectors) == 1
    assert len(vectors[0]) == 768
|
|
|
|
|
|
|
|
|
|
|
|
def test_huggingface_instructor_embedding_query() -> None:
    """Embed a single query string with HuggingFaceInstructEmbeddings.

    The embedder is built with no arguments; the test expects the
    returned vector to have 768 entries.
    """
    embedder = HuggingFaceInstructEmbeddings()
    vector = embedder.embed_query("foo bar")
    assert len(vector) == 768
|