langchain/libs/community/tests/integration_tests/cache/test_momento_cache.py

"""Test Momento cache functionality.

To run tests, set the environment variable MOMENTO_API_KEY to a valid
Momento API key. This can be obtained by signing up for a free
Momento account at https://gomomento.com/.
"""
from __future__ import annotations

import uuid
from datetime import timedelta
from typing import Iterator

import pytest
from langchain.globals import set_llm_cache
from langchain_core.outputs import Generation, LLMResult

from langchain_community.cache import MomentoCache
from tests.unit_tests.llms.fake_llm import FakeLLM


def random_string() -> str:
    """Return a freshly generated version-4 UUID rendered as a string."""
    fresh_uuid = uuid.uuid4()
    return str(fresh_uuid)


@pytest.fixture(scope="module")
def momento_cache() -> Iterator[MomentoCache]:
    """Yield a ``MomentoCache`` installed as the global LLM cache.

    A Momento client is built from the ``MOMENTO_API_KEY`` environment
    variable with a 30 second default TTL, and a uniquely named cache is
    used so that separate test runs do not collide with each other.

    Yields:
        The ``MomentoCache`` instance that was registered via
        ``set_llm_cache``.

    On teardown the previously registered global LLM cache is restored and
    the uniquely named Momento cache is deleted.
    """
    from langchain.globals import get_llm_cache
    from momento import CacheClient, Configurations, CredentialProvider

    cache_name = f"langchain-test-cache-{random_string()}"
    client = CacheClient(
        Configurations.Laptop.v1(),
        CredentialProvider.from_environment_variable("MOMENTO_API_KEY"),
        default_ttl=timedelta(seconds=30),
    )
    # Remember whatever cache was registered before this module ran so the
    # global can be put back afterwards instead of leaking into other tests.
    previous_cache = get_llm_cache()
    try:
        llm_cache = MomentoCache(client, cache_name)
        set_llm_cache(llm_cache)
        yield llm_cache
    finally:
        # Restore the global first: once the remote cache is deleted, the
        # global must no longer point at it, even if the delete call fails.
        set_llm_cache(previous_cache)
        client.delete_cache(cache_name)


def test_invalid_ttl() -> None:
    """Expect ``ValueError`` when ``MomentoCache`` is given a negative TTL."""
    from momento import CacheClient, Configurations, CredentialProvider

    configuration = Configurations.Laptop.v1()
    credentials = CredentialProvider.from_environment_variable("MOMENTO_API_KEY")
    cache_client = CacheClient(
        configuration,
        credentials,
        default_ttl=timedelta(seconds=30),
    )

    unused_cache_name = random_string()
    negative_ttl = timedelta(seconds=-1)
    with pytest.raises(ValueError):
        MomentoCache(cache_client, cache_name=unused_cache_name, ttl=negative_ttl)


def test_momento_cache_miss(momento_cache: MomentoCache) -> None:
    """Generate for a never-seen prompt and expect the fake LLM's own output.

    The ``momento_cache`` fixture is requested only so that the Momento cache
    is registered as the global LLM cache while this test runs.
    """
    fake_llm = FakeLLM()
    expected = LLMResult(generations=[[Generation(text="foo")]])
    # A random prompt has not been stored by any test, so nothing is cached.
    unseen_prompt = random_string()
    actual = fake_llm.generate([unseen_prompt])
    assert actual == expected


@pytest.mark.parametrize(
    "prompts,  generations",
    [
        # One prompt with a single generation
        ([random_string()], [[random_string()]]),
        # One prompt with two generations
        ([random_string()], [[random_string(), random_string()]]),
        # One prompt with three generations
        ([random_string()], [[random_string(), random_string(), random_string()]]),
        # Two prompts: the first with one generation, the second with two
        (
            [random_string(), random_string()],
            [[random_string()], [random_string(), random_string()]],
        ),
    ],
)
def test_momento_cache_hit(
    momento_cache: MomentoCache, prompts: list[str], generations: list[list[str]]
) -> None:
    """Store generations in the cache and expect ``generate`` to return them.

    Args:
        momento_cache: The cache under test, provided by the module fixture.
        prompts: Prompts to store entries for and then generate with.
        generations: For each prompt, the generation texts to store.
    """
    fake_llm = FakeLLM()
    llm_params = fake_llm.dict()
    llm_params["stop"] = None
    # The key string under which entries are stored: the sorted parameter
    # pairs of the LLM, rendered as a string.
    llm_string = str(sorted(llm_params.items()))

    expected_generations = []
    for texts in generations:
        expected_generations.append(
            [Generation(text=text, generation_info=llm_params) for text in texts]
        )

    # Populate the cache directly, one entry per prompt.
    for prompt, cached in zip(prompts, expected_generations):
        momento_cache.update(prompt, llm_string, cached)

    actual = fake_llm.generate(prompts)
    assert actual == LLMResult(generations=expected_generations, llm_output={})
feat: add Momento as a standard cache and chat message history provider (#5221) # Add Momento as a standard cache and chat message history provider This PR adds Momento as a standard caching provider. Implements the interface, adds integration tests, and documentation. We also add Momento as a chat history message provider along with integration tests, and documentation. [Momento](https://www.gomomento.com/) is a fully serverless cache. Similar to S3 or DynamoDB, it requires zero configuration, infrastructure management, and is instantly available. Users sign up for free and get 50GB of data in/out for free every month. ## Before submitting ✅ We have added documentation, notebooks, and integration tests demonstrating usage. Co-authored-by: Dev 2049 <dev.dev2049@gmail.com> 2023-05-26 02:13:21 +00:00			`"""Test Momento cache functionality.`

			`To run tests, set the environment variable MOMENTO_API_KEY to a valid`
			`Momento API key. This can be obtained by signing up for a free`
			`Momento account at https://gomomento.com/.`
			`"""`
			`from __future__ import annotations`

			`import uuid`
			`from datetime import timedelta`
			`from typing import Iterator`

			`import pytest`
multiple: langchain 0.2 in master (#21191) 0.2rc migrations - [x] Move memory - [x] Move remaining retrievers - [x] graph_qa chains - [x] some dependency from evaluation code potentially on math utils - [x] Move openapi chain from `langchain.chains.api.openapi` to `langchain_community.chains.openapi` - [x] Migrate `langchain.chains.ernie_functions` to `langchain_community.chains.ernie_functions` - [x] migrate `langchain/chains/llm_requests.py` to `langchain_community.chains.llm_requests` - [x] Moving `langchain_community.cross_enoders.base:BaseCrossEncoder` -> `langchain_community.retrievers.document_compressors.cross_encoder:BaseCrossEncoder` (namespace not ideal, but it needs to be moved to `langchain` to avoid circular deps) - [x] unit tests langchain -- add pytest.mark.community to some unit tests that will stay in langchain - [x] unit tests community -- move unit tests that depend on community to community - [x] mv integration tests that depend on community to community - [x] mypy checks Other todo - [x] Make deprecation warnings not noisy (need to use warn deprecated and check that things are implemented properly) - [x] Update deprecation messages with timeline for code removal (likely we actually won't be removing things until 0.4 release) -- will give people more time to transition their code. - [ ] Add information to deprecation warning to show users how to migrate their code base using langchain-cli - [ ] Remove any unnecessary requirements in langchain (e.g., is SQLALchemy required?) --------- Co-authored-by: Erick Friis <erick@langchain.dev> 2024-05-08 20:46:52 +00:00			`from langchain.globals import set_llm_cache`
REFACTOR: Refactor langchain_core (#13627) Changes: - remove langchain_core/schema since no clear distinction b/n schema and non-schema modules - make every module that doesn't end in -y plural - where easy have 1-2 classes per file - no more than one level of nesting in directories - only import from top level core modules in langchain 2023-11-21 16:35:29 +00:00			`from langchain_core.outputs import Generation, LLMResult`
feat: add Momento as a standard cache and chat message history provider (#5221) # Add Momento as a standard cache and chat message history provider This PR adds Momento as a standard caching provider. Implements the interface, adds integration tests, and documentation. We also add Momento as a chat history message provider along with integration tests, and documentation. [Momento](https://www.gomomento.com/) is a fully serverless cache. Similar to S3 or DynamoDB, it requires zero configuration, infrastructure management, and is instantly available. Users sign up for free and get 50GB of data in/out for free every month. ## Before submitting ✅ We have added documentation, notebooks, and integration tests demonstrating usage. Co-authored-by: Dev 2049 <dev.dev2049@gmail.com> 2023-05-26 02:13:21 +00:00
multiple: langchain 0.2 in master (#21191) 0.2rc migrations - [x] Move memory - [x] Move remaining retrievers - [x] graph_qa chains - [x] some dependency from evaluation code potentially on math utils - [x] Move openapi chain from `langchain.chains.api.openapi` to `langchain_community.chains.openapi` - [x] Migrate `langchain.chains.ernie_functions` to `langchain_community.chains.ernie_functions` - [x] migrate `langchain/chains/llm_requests.py` to `langchain_community.chains.llm_requests` - [x] Moving `langchain_community.cross_enoders.base:BaseCrossEncoder` -> `langchain_community.retrievers.document_compressors.cross_encoder:BaseCrossEncoder` (namespace not ideal, but it needs to be moved to `langchain` to avoid circular deps) - [x] unit tests langchain -- add pytest.mark.community to some unit tests that will stay in langchain - [x] unit tests community -- move unit tests that depend on community to community - [x] mv integration tests that depend on community to community - [x] mypy checks Other todo - [x] Make deprecation warnings not noisy (need to use warn deprecated and check that things are implemented properly) - [x] Update deprecation messages with timeline for code removal (likely we actually won't be removing things until 0.4 release) -- will give people more time to transition their code. - [ ] Add information to deprecation warning to show users how to migrate their code base using langchain-cli - [ ] Remove any unnecessary requirements in langchain (e.g., is SQLALchemy required?) --------- Co-authored-by: Erick Friis <erick@langchain.dev> 2024-05-08 20:46:52 +00:00			`from langchain_community.cache import MomentoCache`
feat: add Momento as a standard cache and chat message history provider (#5221) # Add Momento as a standard cache and chat message history provider This PR adds Momento as a standard caching provider. Implements the interface, adds integration tests, and documentation. We also add Momento as a chat history message provider along with integration tests, and documentation. [Momento](https://www.gomomento.com/) is a fully serverless cache. Similar to S3 or DynamoDB, it requires zero configuration, infrastructure management, and is instantly available. Users sign up for free and get 50GB of data in/out for free every month. ## Before submitting ✅ We have added documentation, notebooks, and integration tests demonstrating usage. Co-authored-by: Dev 2049 <dev.dev2049@gmail.com> 2023-05-26 02:13:21 +00:00			`from tests.unit_tests.llms.fake_llm import FakeLLM`


			`def random_string() -> str:`
			`return str(uuid.uuid4())`


			`@pytest.fixture(scope="module")`
			`def momento_cache() -> Iterator[MomentoCache]:`
scheduled tests GHA (#8879) Adding scheduled daily GHA that runs marked integration tests. To start just marking some tests in test_openai 2023-08-08 21:55:25 +00:00			`from momento import CacheClient, Configurations, CredentialProvider`

feat: add Momento as a standard cache and chat message history provider (#5221) # Add Momento as a standard cache and chat message history provider This PR adds Momento as a standard caching provider. Implements the interface, adds integration tests, and documentation. We also add Momento as a chat history message provider along with integration tests, and documentation. [Momento](https://www.gomomento.com/) is a fully serverless cache. Similar to S3 or DynamoDB, it requires zero configuration, infrastructure management, and is instantly available. Users sign up for free and get 50GB of data in/out for free every month. ## Before submitting ✅ We have added documentation, notebooks, and integration tests demonstrating usage. Co-authored-by: Dev 2049 <dev.dev2049@gmail.com> 2023-05-26 02:13:21 +00:00			`cache_name = f"langchain-test-cache-{random_string()}"`
			`client = CacheClient(`
			`Configurations.Laptop.v1(),`
feat: add momento vector index as a vector store provider (#11567) Description: - Added Momento Vector Index (MVI) as a vector store provider. This includes an implementation with docstrings, integration tests, a notebook, and documentation on the docs pages. - Updated the Momento dependency in pyproject.toml and the lock file to enable access to MVI. - Refactored the Momento cache and chat history session store to prefer using "MOMENTO_API_KEY" over "MOMENTO_AUTH_TOKEN" for consistency with MVI. This change is backwards compatible with the previous "auth_token" variable usage. Updated the code and tests accordingly. Dependencies: - Updated Momento dependency in pyproject.toml. Testing: - Run the integration tests with a Momento API key. Get one at the [Momento Console](https://console.gomomento.com) for free. MVI is available in AWS us-west-2 with a superuser key. - `MOMENTO_API_KEY=<your key> poetry run pytest tests/integration_tests/vectorstores/test_momento_vector_index.py` Tag maintainer: @eyurtsev Twitter handle: Please mention @momentohq for this addition to langchain. With the integration of Momento Vector Index, Momento caching, and session store, Momento provides serverless support for the core langchain data needs. Also mention @mlonml for the integration. 2023-10-09 21:02:59 +00:00			`CredentialProvider.from_environment_variable("MOMENTO_API_KEY"),`
feat: add Momento as a standard cache and chat message history provider (#5221) # Add Momento as a standard cache and chat message history provider This PR adds Momento as a standard caching provider. Implements the interface, adds integration tests, and documentation. We also add Momento as a chat history message provider along with integration tests, and documentation. [Momento](https://www.gomomento.com/) is a fully serverless cache. Similar to S3 or DynamoDB, it requires zero configuration, infrastructure management, and is instantly available. Users sign up for free and get 50GB of data in/out for free every month. ## Before submitting ✅ We have added documentation, notebooks, and integration tests demonstrating usage. Co-authored-by: Dev 2049 <dev.dev2049@gmail.com> 2023-05-26 02:13:21 +00:00			`default_ttl=timedelta(seconds=30),`
			`)`
			`try:`
			`llm_cache = MomentoCache(client, cache_name)`
use get_llm_cache and set_llm_cache (#11741) Co-authored-by: Bagatur <baskaryan@gmail.com> 2023-10-14 16:29:30 +00:00			`set_llm_cache(llm_cache)`
feat: add Momento as a standard cache and chat message history provider (#5221) # Add Momento as a standard cache and chat message history provider This PR adds Momento as a standard caching provider. Implements the interface, adds integration tests, and documentation. We also add Momento as a chat history message provider along with integration tests, and documentation. [Momento](https://www.gomomento.com/) is a fully serverless cache. Similar to S3 or DynamoDB, it requires zero configuration, infrastructure management, and is instantly available. Users sign up for free and get 50GB of data in/out for free every month. ## Before submitting ✅ We have added documentation, notebooks, and integration tests demonstrating usage. Co-authored-by: Dev 2049 <dev.dev2049@gmail.com> 2023-05-26 02:13:21 +00:00			`yield llm_cache`
			`finally:`
			`client.delete_cache(cache_name)`


			`def test_invalid_ttl() -> None:`
scheduled tests GHA (#8879) Adding scheduled daily GHA that runs marked integration tests. To start just marking some tests in test_openai 2023-08-08 21:55:25 +00:00			`from momento import CacheClient, Configurations, CredentialProvider`

feat: add Momento as a standard cache and chat message history provider (#5221) # Add Momento as a standard cache and chat message history provider This PR adds Momento as a standard caching provider. Implements the interface, adds integration tests, and documentation. We also add Momento as a chat history message provider along with integration tests, and documentation. [Momento](https://www.gomomento.com/) is a fully serverless cache. Similar to S3 or DynamoDB, it requires zero configuration, infrastructure management, and is instantly available. Users sign up for free and get 50GB of data in/out for free every month. ## Before submitting ✅ We have added documentation, notebooks, and integration tests demonstrating usage. Co-authored-by: Dev 2049 <dev.dev2049@gmail.com> 2023-05-26 02:13:21 +00:00			`client = CacheClient(`
			`Configurations.Laptop.v1(),`
feat: add momento vector index as a vector store provider (#11567) Description: - Added Momento Vector Index (MVI) as a vector store provider. This includes an implementation with docstrings, integration tests, a notebook, and documentation on the docs pages. - Updated the Momento dependency in pyproject.toml and the lock file to enable access to MVI. - Refactored the Momento cache and chat history session store to prefer using "MOMENTO_API_KEY" over "MOMENTO_AUTH_TOKEN" for consistency with MVI. This change is backwards compatible with the previous "auth_token" variable usage. Updated the code and tests accordingly. Dependencies: - Updated Momento dependency in pyproject.toml. Testing: - Run the integration tests with a Momento API key. Get one at the [Momento Console](https://console.gomomento.com) for free. MVI is available in AWS us-west-2 with a superuser key. - `MOMENTO_API_KEY=<your key> poetry run pytest tests/integration_tests/vectorstores/test_momento_vector_index.py` Tag maintainer: @eyurtsev Twitter handle: Please mention @momentohq for this addition to langchain. With the integration of Momento Vector Index, Momento caching, and session store, Momento provides serverless support for the core langchain data needs. Also mention @mlonml for the integration. 2023-10-09 21:02:59 +00:00			`CredentialProvider.from_environment_variable("MOMENTO_API_KEY"),`
feat: add Momento as a standard cache and chat message history provider (#5221) # Add Momento as a standard cache and chat message history provider This PR adds Momento as a standard caching provider. Implements the interface, adds integration tests, and documentation. We also add Momento as a chat history message provider along with integration tests, and documentation. [Momento](https://www.gomomento.com/) is a fully serverless cache. Similar to S3 or DynamoDB, it requires zero configuration, infrastructure management, and is instantly available. Users sign up for free and get 50GB of data in/out for free every month. ## Before submitting ✅ We have added documentation, notebooks, and integration tests demonstrating usage. Co-authored-by: Dev 2049 <dev.dev2049@gmail.com> 2023-05-26 02:13:21 +00:00			`default_ttl=timedelta(seconds=30),`
			`)`
			`with pytest.raises(ValueError):`
			`MomentoCache(client, cache_name=random_string(), ttl=timedelta(seconds=-1))`


			`def test_momento_cache_miss(momento_cache: MomentoCache) -> None:`
			`llm = FakeLLM()`
			`stub_llm_output = LLMResult(generations=[[Generation(text="foo")]])`
			`assert llm.generate([random_string()]) == stub_llm_output`


			`@pytest.mark.parametrize(`
			`"prompts, generations",`
			`[`
			`# Single prompt, single generation`
			`([random_string()], [[random_string()]]),`
			`# Single prompt, multiple generations`
			`([random_string()], [[random_string(), random_string()]]),`
			`# Single prompt, multiple generations`
			`([random_string()], [[random_string(), random_string(), random_string()]]),`
			`# Multiple prompts, multiple generations`
			`(`
			`[random_string(), random_string()],`
			`[[random_string()], [random_string(), random_string()]],`
			`),`
			`],`
			`)`
			`def test_momento_cache_hit(`
			`momento_cache: MomentoCache, prompts: list[str], generations: list[list[str]]`
			`) -> None:`
			`llm = FakeLLM()`
			`params = llm.dict()`
			`params["stop"] = None`
			`llm_string = str(sorted([(k, v) for k, v in params.items()]))`

			`llm_generations = [`
			`[`
			`Generation(text=generation, generation_info=params)`
			`for generation in prompt_i_generations`
			`]`
			`for prompt_i_generations in generations`
			`]`
			`for prompt_i, llm_generations_i in zip(prompts, llm_generations):`
			`momento_cache.update(prompt_i, llm_string, llm_generations_i)`

			`assert llm.generate(prompts) == LLMResult(`
			`generations=llm_generations, llm_output={}`
			`)`