# langchain/libs/community/tests/unit_tests/embeddings/test_infinity_local.py

import numpy as np
import pytest

from langchain_community.embeddings.infinity_local import InfinityEmbeddingsLocal

# Probe for the optional heavy dependencies used by the local Infinity backend.
# The flag is True only when BOTH `torch` and `infinity_emb` import cleanly;
# the test below is skipped otherwise.
try:
    import torch  # noqa
    import infinity_emb  # noqa
except ImportError:
    IMPORTED_TORCH = False
else:
    IMPORTED_TORCH = True


@pytest.mark.skipif(
    not IMPORTED_TORCH,
    # The flag covers both optional imports, so name both in the skip message.
    reason="torch or infinity_emb not installed",
)
@pytest.mark.asyncio
async def test_local_infinity_embeddings() -> None:
    """Embed three short texts with the local Infinity backend and check them.

    The inputs are ``["text1", "text2", "text1"]`` embedded with
    ``batch_size=2``. The test verifies that:

    * one embedding is returned per input text,
    * every embedding has 384 components (the expected output size of
      ``TaylorAI/bge-micro-v2``),
    * the embeddings of two different texts differ in every component,
    * the embeddings of the two identical texts agree up to floating point
      error.
    """
    texts = ["text1", "text2", "text1"]
    expected_dim = 384  # model has 384 dim output

    embedder = InfinityEmbeddingsLocal(
        model="TaylorAI/bge-micro-v2",
        device="cpu",
        backend="torch",
        revision=None,
        batch_size=2,
        model_warmup=False,
    )

    async with embedder:
        embeddings = await embedder.aembed_documents(texts)
        assert len(embeddings) == len(texts)
        for vector in embeddings:
            assert len(vector) == expected_dim
        # assert all different embeddings
        assert (np.array(embeddings[0]) - np.array(embeddings[1]) != 0).all()
        # Identical inputs must give matching embeddings. Compare with a tight
        # tolerance rather than bit-exact equality: the duplicated text may be
        # processed in a different batch (3 inputs, batch_size=2), which can
        # introduce tiny floating point differences.
        np.testing.assert_allclose(
            embeddings[0], embeddings[2], rtol=1e-5, atol=1e-6
        )


if __name__ == "__main__":
    # Allow running this test file directly as a script, outside of pytest:
    # drive the async test to completion on a fresh event loop.
    from asyncio import run

    test_coroutine = test_local_infinity_embeddings()
    run(test_coroutine)
community[minor]: infinity embedding local option (#17671) drop-in-replacement for sentence-transformers inference. https://github.com/langchain-ai/langchain/discussions/17670 tldr from the discussion above -> around a 4x-22x speedup over using SentenceTransformers / huggingface embeddings. For more info: https://github.com/michaelfeil/infinity (pure-python dependency) --------- Co-authored-by: Erick Friis <erick@langchain.dev> 2024-02-22 00:33:13 +00:00			`import numpy as np`
			`import pytest`

			`from langchain_community.embeddings.infinity_local import InfinityEmbeddingsLocal`

			`try:`
			`import torch # noqa`
			`import infinity_emb # noqa`

			`IMPORTED_TORCH = True`
			`except ImportError:`
			`IMPORTED_TORCH = False`


			`@pytest.mark.skipif(not IMPORTED_TORCH, reason="torch not installed")`
			`@pytest.mark.asyncio`
			`async def test_local_infinity_embeddings() -> None:`
			`embedder = InfinityEmbeddingsLocal(`
			`model="TaylorAI/bge-micro-v2",`
			`device="cpu",`
			`backend="torch",`
			`revision=None,`
			`batch_size=2,`
			`model_warmup=False,`
			`)`

			`async with embedder:`
			`embeddings = await embedder.aembed_documents(["text1", "text2", "text1"])`
			`assert len(embeddings) == 3`
			`# model has 384 dim output`
			`assert len(embeddings[0]) == 384`
			`assert len(embeddings[1]) == 384`
			`assert len(embeddings[2]) == 384`
			`# assert all different embeddings`
			`assert (np.array(embeddings[0]) - np.array(embeddings[1]) != 0).all()`
			`# assert identical embeddings, up to floating point error`
			`np.testing.assert_array_equal(embeddings[0], embeddings[2])`


			`if __name__ == "__main__":`
			`import asyncio`

			`asyncio.run(test_local_infinity_embeddings())`