langchain/tests/integration_tests/llms/test_openai.py

"""Test OpenAI API wrapper."""

from pathlib import Path
from typing import Generator

import pytest

from langchain.callbacks.manager import CallbackManager
from langchain.llms.loading import load_llm
from langchain.llms.openai import OpenAI, OpenAIChat
from langchain.schema import LLMResult
from tests.unit_tests.callbacks.fake_callback_handler import FakeCallbackHandler


def test_openai_call() -> None:
    """Check that calling the OpenAI wrapper with a prompt returns a string."""
    completion = OpenAI(max_tokens=10)("Say foo:")
    assert isinstance(completion, str)


def test_openai_extra_kwargs() -> None:
    """Check how extra constructor kwargs interact with ``model_kwargs``."""
    # An unknown keyword ("foo") is stored in model_kwargs, while a declared
    # field such as max_tokens stays a regular attribute.
    with_extra = OpenAI(foo=3, max_tokens=10)
    assert with_extra.max_tokens == 10
    assert with_extra.model_kwargs == {"foo": 3}

    # Unknown keywords are merged into an explicitly supplied model_kwargs.
    merged = OpenAI(foo=3, model_kwargs={"bar": 2})
    assert merged.model_kwargs == {"foo": 3, "bar": 2}

    # The same key given both directly and inside model_kwargs is rejected.
    duplicate_key = {"foo": 2}
    with pytest.raises(ValueError):
        OpenAI(foo=3, model_kwargs=duplicate_key)

    # An explicit parameter (temperature) must not be passed via model_kwargs.
    explicit_param = {"temperature": 0.2}
    with pytest.raises(ValueError):
        OpenAI(model_kwargs=explicit_param)

    # "model" is likewise not accepted inside model_kwargs.
    model_override = {"model": "text-davinci-003"}
    with pytest.raises(ValueError):
        OpenAI(model_kwargs=model_override)


def test_openai_llm_output_contains_model_name() -> None:
    """Check that ``generate`` reports the model name in ``llm_output``."""
    model = OpenAI(max_tokens=10)
    metadata = model.generate(["Hello, how are you?"]).llm_output
    assert metadata is not None
    assert metadata["model_name"] == model.model_name


def test_openai_stop_valid() -> None:
    """Check that a stop sequence behaves the same at init and at call time."""
    prompt = "write an ordered list of five items"
    # Stop sequence supplied when the wrapper is constructed.
    output_stop_at_init = OpenAI(stop="3", temperature=0)(prompt)
    # Same stop sequence supplied with the call instead.
    output_stop_at_call = OpenAI(temperature=0)(prompt, stop=["3"])
    # Both runs use temperature=0 and the same stop sequence, so the
    # completions are expected to be identical.
    assert output_stop_at_init == output_stop_at_call


def test_openai_stop_error() -> None:
    """Check that giving ``stop`` at both init and call time raises ValueError."""
    llm_with_stop = OpenAI(stop="3", temperature=0)
    prompt = "write an ordered list of five items"
    with pytest.raises(ValueError):
        llm_with_stop(prompt, stop=["\n"])


def test_saving_loading_llm(tmp_path: Path) -> None:
    """Check that an OpenAI LLM saved to YAML loads back as an equal object."""
    original = OpenAI(max_tokens=10)
    yaml_file = tmp_path / "openai.yaml"
    original.save(file_path=yaml_file)
    assert load_llm(yaml_file) == original


def test_openai_streaming() -> None:
    """Check that ``stream`` returns a generator whose chunks carry text."""
    token_stream = OpenAI(max_tokens=10).stream("I'm Pickle Rick")

    assert isinstance(token_stream, Generator)

    for chunk in token_stream:
        # Each chunk is indexed like a completion response: first choice's text.
        text = chunk["choices"][0]["text"]
        assert isinstance(text, str)


def test_openai_streaming_error() -> None:
    """Check that ``stream`` raises ValueError when the LLM has ``best_of=2``."""
    # Construction happens outside the raises block: only stream() is
    # expected to raise here.
    best_of_llm = OpenAI(best_of=2)
    with pytest.raises(ValueError):
        best_of_llm.stream("I'm Pickle Rick")


def test_openai_streaming_best_of_error() -> None:
    """Check that ``streaming=True`` with ``best_of=2`` fails at construction."""
    invalid_config = {"best_of": 2, "streaming": True}
    with pytest.raises(ValueError):
        OpenAI(**invalid_config)


def test_openai_streaming_n_error() -> None:
    """Check that ``streaming=True`` with ``n=2`` fails at construction."""
    invalid_config = {"n": 2, "streaming": True}
    with pytest.raises(ValueError):
        OpenAI(**invalid_config)


def test_openai_streaming_multiple_prompts_error() -> None:
    """Check that a streaming LLM rejects ``generate`` with several prompts."""
    two_prompts = ["I'm Pickle Rick", "I'm Pickle Rick"]
    with pytest.raises(ValueError):
        OpenAI(streaming=True).generate(two_prompts)


def test_openai_streaming_call() -> None:
    """Check that a call with ``streaming=True`` still returns a string."""
    completion = OpenAI(max_tokens=10, streaming=True)("Say foo:")
    assert isinstance(completion, str)


def test_openai_streaming_callback() -> None:
    """Check that streaming triggers the on_llm_new_token callback."""
    handler = FakeCallbackHandler()
    streaming_llm = OpenAI(
        max_tokens=10,
        streaming=True,
        temperature=0,
        callback_manager=CallbackManager([handler]),
        verbose=True,
    )
    streaming_llm("Write me a sentence with 100 words.")
    # Expected count equals max_tokens; presumably the handler counts one
    # stream event per generated token (verify against FakeCallbackHandler).
    assert handler.llm_streams == 10


@pytest.mark.asyncio
async def test_openai_async_generate() -> None:
    """Check that ``agenerate`` returns an ``LLMResult``."""
    result = await OpenAI(max_tokens=10).agenerate(["Hello, how are you?"])
    assert isinstance(result, LLMResult)


@pytest.mark.asyncio
async def test_openai_async_streaming_callback() -> None:
    """Check that async streaming triggers the on_llm_new_token callback."""
    handler = FakeCallbackHandler()
    streaming_llm = OpenAI(
        max_tokens=10,
        streaming=True,
        temperature=0,
        callback_manager=CallbackManager([handler]),
        verbose=True,
    )
    llm_result = await streaming_llm.agenerate(
        ["Write me a sentence with 100 words."]
    )
    # Expected count equals max_tokens; presumably the handler counts one
    # stream event per generated token (verify against FakeCallbackHandler).
    assert handler.llm_streams == 10
    assert isinstance(llm_result, LLMResult)


def test_openai_chat_wrong_class() -> None:
    """Check that ``OpenAI`` given the "gpt-3.5-turbo" model name still works."""
    completion = OpenAI(model_name="gpt-3.5-turbo")("Say foo:")
    assert isinstance(completion, str)


def test_openai_chat() -> None:
    """Check that calling ``OpenAIChat`` with a prompt returns a string."""
    reply = OpenAIChat(max_tokens=10)("Say foo:")
    assert isinstance(reply, str)


def test_openai_chat_streaming() -> None:
    """Check that ``OpenAIChat`` with ``streaming=True`` returns a string."""
    reply = OpenAIChat(max_tokens=10, streaming=True)("Say foo:")
    assert isinstance(reply, str)


def test_openai_chat_streaming_callback() -> None:
    """Check that OpenAIChat streaming triggers the on_llm_new_token callback."""
    handler = FakeCallbackHandler()
    chat_llm = OpenAIChat(
        max_tokens=10,
        streaming=True,
        temperature=0,
        callback_manager=CallbackManager([handler]),
        verbose=True,
    )
    chat_llm("Write me a sentence with 100 words.")
    # Only requires that at least one stream event was recorded.
    assert handler.llm_streams != 0


@pytest.mark.asyncio
async def test_openai_chat_async_generate() -> None:
    """Check that ``OpenAIChat.agenerate`` returns an ``LLMResult``."""
    result = await OpenAIChat(max_tokens=10).agenerate(["Hello, how are you?"])
    assert isinstance(result, LLMResult)


@pytest.mark.asyncio
async def test_openai_chat_async_streaming_callback() -> None:
    """Check that async OpenAIChat streaming triggers on_llm_new_token."""
    handler = FakeCallbackHandler()
    chat_llm = OpenAIChat(
        max_tokens=10,
        streaming=True,
        temperature=0,
        callback_manager=CallbackManager([handler]),
        verbose=True,
    )
    llm_result = await chat_llm.agenerate(["Write me a sentence with 100 words."])
    # Only requires that at least one stream event was recorded.
    assert handler.llm_streams != 0
    assert isinstance(llm_result, LLMResult)


def test_openai_modelname_to_contextsize_valid() -> None:
    """Check the context size reported for the known model "davinci"."""
    context_size = OpenAI().modelname_to_contextsize("davinci")
    assert context_size == 2049


def test_openai_modelname_to_contextsize_invalid() -> None:
    """Check that an unknown model name raises ValueError."""
    unknown_model = "foobar"
    with pytest.raises(ValueError):
        OpenAI().modelname_to_contextsize(unknown_model)
initial commit 2022-10-24 21:51:15 +00:00			`"""Test OpenAI API wrapper."""`

Harrison/llm saving (#331) Co-authored-by: Akash Samant <70665700+asamant21@users.noreply.github.com> 2022-12-13 14:46:01 +00:00			`from pathlib import Path`
Support Streaming Tokens from OpenAI (#364) https://github.com/hwchase17/langchain/issues/363 @hwchase17 how much does this make you want to cry? 2022-12-17 15:02:58 +00:00			`from typing import Generator`
Harrison/llm saving (#331) Co-authored-by: Akash Samant <70665700+asamant21@users.noreply.github.com> 2022-12-13 14:46:01 +00:00
Harrison/arbitrary params (#186) 2022-11-25 04:01:20 +00:00			`import pytest`

Callbacks Refactor [base] (#3256) Co-authored-by: Nuno Campos <nuno@boringbits.io> Co-authored-by: Davis Chase <130488702+dev2049@users.noreply.github.com> Co-authored-by: Zander Chase <130414180+vowelparrot@users.noreply.github.com> Co-authored-by: Harrison Chase <hw.chase.17@gmail.com> 2023-04-30 18:14:09 +00:00			`from langchain.callbacks.manager import CallbackManager`
Harrison/llm saving (#331) Co-authored-by: Akash Samant <70665700+asamant21@users.noreply.github.com> 2022-12-13 14:46:01 +00:00			`from langchain.llms.loading import load_llm`
add async and streaming support to `OpenAIChat` (#1378) title says it all 2023-03-02 05:55:43 +00:00			`from langchain.llms.openai import OpenAI, OpenAIChat`
Add asyncio support for LLM (OpenAI), Chain (LLMChain, LLMMathChain), and Agent (#841) Supporting asyncio in langchain primitives allows for users to run them concurrently and creates more seamless integration with asyncio-supported frameworks (FastAPI, etc.) Summary of changes: LLM * Add `agenerate` and `_agenerate` * Implement in OpenAI by leveraging `client.Completions.acreate` Chain * Add `arun`, `acall`, `_acall` * Implement them in `LLMChain` and `LLMMathChain` for now Agent * Refactor and leverage async chain and llm methods * Add ability for `Tools` to contain async coroutine * Implement async SerpaPI `arun` Create demo notebook. Open questions: * Should all the async stuff go in separate classes? I've seen both patterns (keeping the same class and having async and sync methods vs. having class separation) 2023-02-08 05:21:57 +00:00			`from langchain.schema import LLMResult`
Enable streaming for OpenAI LLM (#986) * Support a callback `on_llm_new_token` that users can implement when `OpenAI.streaming` is set to `True` 2023-02-14 23:06:14 +00:00			`from tests.unit_tests.callbacks.fake_callback_handler import FakeCallbackHandler`
initial commit 2022-10-24 21:51:15 +00:00

fix test name (#22) 2022-10-26 03:22:16 +00:00			`def test_openai_call() -> None:`
			`"""Test valid call to openai."""`
initial commit 2022-10-24 21:51:15 +00:00			`llm = OpenAI(max_tokens=10)`
			`output = llm("Say foo:")`
			`assert isinstance(output, str)`
Harrison/arbitrary params (#186) 2022-11-25 04:01:20 +00:00

			`def test_openai_extra_kwargs() -> None:`
			`"""Test extra kwargs to openai."""`
			`# Check that foo is saved in extra_kwargs.`
			`llm = OpenAI(foo=3, max_tokens=10)`
			`assert llm.max_tokens == 10`
			`assert llm.model_kwargs == {"foo": 3}`

			`# Test that if extra_kwargs are provided, they are added to it.`
			`llm = OpenAI(foo=3, model_kwargs={"bar": 2})`
			`assert llm.model_kwargs == {"foo": 3, "bar": 2}`

			`# Test that if provided twice it errors`
			`with pytest.raises(ValueError):`
			`OpenAI(foo=3, model_kwargs={"foo": 2})`
allow passing of stop params into openai (#232) 2022-12-01 06:20:13 +00:00
Check OpenAI model kwargs (#4366) Handle duplicate and incorrectly specified OpenAI params Thanks @PawelFaron for the fix! Made small update Closes #4331 --------- Co-authored-by: PawelFaron <42373772+PawelFaron@users.noreply.github.com> Co-authored-by: Pawel Faron <ext-pawel.faron@vaisala.com> 2023-05-08 23:37:34 +00:00			`# Test that if explicit param is specified in kwargs it errors`
			`with pytest.raises(ValueError):`
			`OpenAI(model_kwargs={"temperature": 0.2})`

			`# Test that "model" cannot be specified in kwargs`
			`with pytest.raises(ValueError):`
			`OpenAI(model_kwargs={"model": "text-davinci-003"})`

allow passing of stop params into openai (#232) 2022-12-01 06:20:13 +00:00
(OpenAI) Add model_name to LLMResult.llm_output (#1713) Given that different models have very different latencies and pricings, it's benefitial to pass the information about the model that generated the response. Such information allows implementing custom callback managers and track usage and price per model. Addresses https://github.com/hwchase17/langchain/issues/1557. 2023-03-17 04:55:55 +00:00			`def test_openai_llm_output_contains_model_name() -> None:`
			`"""Test llm_output contains model_name."""`
			`llm = OpenAI(max_tokens=10)`
			`llm_result = llm.generate(["Hello, how are you?"])`
			`assert llm_result.llm_output is not None`
			`assert llm_result.llm_output["model_name"] == llm.model_name`


allow passing of stop params into openai (#232) 2022-12-01 06:20:13 +00:00			`def test_openai_stop_valid() -> None:`
			`"""Test openai stop logic on valid configuration."""`
			`query = "write an ordered list of five items"`
			`first_llm = OpenAI(stop="3", temperature=0)`
			`first_output = first_llm(query)`
			`second_llm = OpenAI(temperature=0)`
			`second_output = second_llm(query, stop=["3"])`
			`# Because it stops on new lines, shouldn't return anything`
			`assert first_output == second_output`


			`def test_openai_stop_error() -> None:`
			`"""Test openai stop logic on bad configuration."""`
			`llm = OpenAI(stop="3", temperature=0)`
			`with pytest.raises(ValueError):`
			`llm("write an ordered list of five items", stop=["\n"])`
Harrison/llm saving (#331) Co-authored-by: Akash Samant <70665700+asamant21@users.noreply.github.com> 2022-12-13 14:46:01 +00:00

			`def test_saving_loading_llm(tmp_path: Path) -> None:`
fix `ChatOpenAI.agenerate` (#1504) 2023-03-07 23:22:05 +00:00			`"""Test saving/loading an OpenAI LLM."""`
Harrison/llm saving (#331) Co-authored-by: Akash Samant <70665700+asamant21@users.noreply.github.com> 2022-12-13 14:46:01 +00:00			`llm = OpenAI(max_tokens=10)`
			`llm.save(file_path=tmp_path / "openai.yaml")`
			`loaded_llm = load_llm(tmp_path / "openai.yaml")`
			`assert loaded_llm == llm`
Support Streaming Tokens from OpenAI (#364) https://github.com/hwchase17/langchain/issues/363 @hwchase17 how much does this make you want to cry? 2022-12-17 15:02:58 +00:00

			`def test_openai_streaming() -> None:`
			`"""Test streaming tokens from OpenAI."""`
			`llm = OpenAI(max_tokens=10)`
			`generator = llm.stream("I'm Pickle Rick")`

			`assert isinstance(generator, Generator)`

			`for token in generator:`
			`assert isinstance(token["choices"][0]["text"], str)`


			`def test_openai_streaming_error() -> None:`
			`"""Test error handling in stream."""`
			`llm = OpenAI(best_of=2)`
			`with pytest.raises(ValueError):`
			`llm.stream("I'm Pickle Rick")`
Add asyncio support for LLM (OpenAI), Chain (LLMChain, LLMMathChain), and Agent (#841) Supporting asyncio in langchain primitives allows for users to run them concurrently and creates more seamless integration with asyncio-supported frameworks (FastAPI, etc.) Summary of changes: LLM * Add `agenerate` and `_agenerate` * Implement in OpenAI by leveraging `client.Completions.acreate` Chain * Add `arun`, `acall`, `_acall` * Implement them in `LLMChain` and `LLMMathChain` for now Agent * Refactor and leverage async chain and llm methods * Add ability for `Tools` to contain async coroutine * Implement async SerpaPI `arun` Create demo notebook. Open questions: * Should all the async stuff go in separate classes? I've seen both patterns (keeping the same class and having async and sync methods vs. having class separation) 2023-02-08 05:21:57 +00:00

Enable streaming for OpenAI LLM (#986) * Support a callback `on_llm_new_token` that users can implement when `OpenAI.streaming` is set to `True` 2023-02-14 23:06:14 +00:00			`def test_openai_streaming_best_of_error() -> None:`
			`"""Test validation for streaming fails if best_of is not 1."""`
			`with pytest.raises(ValueError):`
			`OpenAI(best_of=2, streaming=True)`


			`def test_openai_streaming_n_error() -> None:`
			`"""Test validation for streaming fails if n is not 1."""`
			`with pytest.raises(ValueError):`
			`OpenAI(n=2, streaming=True)`


			`def test_openai_streaming_multiple_prompts_error() -> None:`
			`"""Test validation for streaming fails if multiple prompts are given."""`
			`with pytest.raises(ValueError):`
			`OpenAI(streaming=True).generate(["I'm Pickle Rick", "I'm Pickle Rick"])`


			`def test_openai_streaming_call() -> None:`
			`"""Test valid call to openai."""`
			`llm = OpenAI(max_tokens=10, streaming=True)`
			`output = llm("Say foo:")`
			`assert isinstance(output, str)`


			`def test_openai_streaming_callback() -> None:`
			`"""Test that streaming correctly invokes on_llm_new_token callback."""`
			`callback_handler = FakeCallbackHandler()`
			`callback_manager = CallbackManager([callback_handler])`
			`llm = OpenAI(`
			`max_tokens=10,`
			`streaming=True,`
			`temperature=0,`
			`callback_manager=callback_manager,`
			`verbose=True,`
			`)`
			`llm("Write me a sentence with 100 words.")`
			`assert callback_handler.llm_streams == 10`


Add asyncio support for LLM (OpenAI), Chain (LLMChain, LLMMathChain), and Agent (#841) Supporting asyncio in langchain primitives allows for users to run them concurrently and creates more seamless integration with asyncio-supported frameworks (FastAPI, etc.) Summary of changes: LLM * Add `agenerate` and `_agenerate` * Implement in OpenAI by leveraging `client.Completions.acreate` Chain * Add `arun`, `acall`, `_acall` * Implement them in `LLMChain` and `LLMMathChain` for now Agent * Refactor and leverage async chain and llm methods * Add ability for `Tools` to contain async coroutine * Implement async SerpaPI `arun` Create demo notebook. Open questions: * Should all the async stuff go in separate classes? I've seen both patterns (keeping the same class and having async and sync methods vs. having class separation) 2023-02-08 05:21:57 +00:00			`@pytest.mark.asyncio`
			`async def test_openai_async_generate() -> None:`
			`"""Test async generation."""`
			`llm = OpenAI(max_tokens=10)`
			`output = await llm.agenerate(["Hello, how are you?"])`
			`assert isinstance(output, LLMResult)`
Enable streaming for OpenAI LLM (#986) * Support a callback `on_llm_new_token` that users can implement when `OpenAI.streaming` is set to `True` 2023-02-14 23:06:14 +00:00

			`@pytest.mark.asyncio`
			`async def test_openai_async_streaming_callback() -> None:`
			`"""Test that streaming correctly invokes on_llm_new_token callback."""`
			`callback_handler = FakeCallbackHandler()`
			`callback_manager = CallbackManager([callback_handler])`
			`llm = OpenAI(`
			`max_tokens=10,`
			`streaming=True,`
			`temperature=0,`
			`callback_manager=callback_manager,`
			`verbose=True,`
			`)`
			`result = await llm.agenerate(["Write me a sentence with 100 words."])`
			`assert callback_handler.llm_streams == 10`
			`assert isinstance(result, LLMResult)`
add async and streaming support to `OpenAIChat` (#1378) title says it all 2023-03-02 05:55:43 +00:00

Allow the regular openai class to be used for ChatGPT models (#1393) Co-authored-by: Harrison Chase <hw.chase.17@gmail.com> 2023-03-02 17:04:18 +00:00			`def test_openai_chat_wrong_class() -> None:`
			`"""Test OpenAIChat with wrong class still works."""`
			`llm = OpenAI(model_name="gpt-3.5-turbo")`
			`output = llm("Say foo:")`
			`assert isinstance(output, str)`


add async and streaming support to `OpenAIChat` (#1378) title says it all 2023-03-02 05:55:43 +00:00			`def test_openai_chat() -> None:`
			`"""Test OpenAIChat."""`
			`llm = OpenAIChat(max_tokens=10)`
			`output = llm("Say foo:")`
			`assert isinstance(output, str)`


			`def test_openai_chat_streaming() -> None:`
			`"""Test OpenAIChat with streaming option."""`
			`llm = OpenAIChat(max_tokens=10, streaming=True)`
			`output = llm("Say foo:")`
			`assert isinstance(output, str)`


			`def test_openai_chat_streaming_callback() -> None:`
			`"""Test that streaming correctly invokes on_llm_new_token callback."""`
			`callback_handler = FakeCallbackHandler()`
			`callback_manager = CallbackManager([callback_handler])`
			`llm = OpenAIChat(`
			`max_tokens=10,`
			`streaming=True,`
			`temperature=0,`
			`callback_manager=callback_manager,`
			`verbose=True,`
			`)`
			`llm("Write me a sentence with 100 words.")`
			`assert callback_handler.llm_streams != 0`


			`@pytest.mark.asyncio`
			`async def test_openai_chat_async_generate() -> None:`
			`"""Test async chat."""`
			`llm = OpenAIChat(max_tokens=10)`
			`output = await llm.agenerate(["Hello, how are you?"])`
			`assert isinstance(output, LLMResult)`


			`@pytest.mark.asyncio`
			`async def test_openai_chat_async_streaming_callback() -> None:`
			`"""Test that streaming correctly invokes on_llm_new_token callback."""`
			`callback_handler = FakeCallbackHandler()`
			`callback_manager = CallbackManager([callback_handler])`
			`llm = OpenAIChat(`
			`max_tokens=10,`
			`streaming=True,`
			`temperature=0,`
			`callback_manager=callback_manager,`
			`verbose=True,`
			`)`
			`result = await llm.agenerate(["Write me a sentence with 100 words."])`
			`assert callback_handler.llm_streams != 0`
			`assert isinstance(result, LLMResult)`
OpenAI LLM: update `modelname_to_contextsize` with new models (#2843) Token counts pulled from https://openai.com/pricing 2023-04-13 18:13:34 +00:00

			`def test_openai_modelname_to_contextsize_valid() -> None:`
			`"""Test model name to context size on a valid model."""`
			`assert OpenAI().modelname_to_contextsize("davinci") == 2049`


			`def test_openai_modelname_to_contextsize_invalid() -> None:`
			`"""Test model name to context size on an invalid model."""`
			`with pytest.raises(ValueError):`
			`OpenAI().modelname_to_contextsize("foobar")`