langchain/libs/community/tests/unit_tests/callbacks/test_openai_info.py

from unittest.mock import MagicMock
from uuid import uuid4

import pytest
from langchain_core.outputs import LLMResult

from langchain_community.callbacks import OpenAICallbackHandler
from langchain_community.llms.openai import BaseOpenAI


@pytest.fixture
def handler() -> OpenAICallbackHandler:
    """Build the ``OpenAICallbackHandler`` instance used by the tests below."""
    callback_handler = OpenAICallbackHandler()
    return callback_handler


def test_on_llm_end(handler: OpenAICallbackHandler) -> None:
    """Check the counters and cost recorded by ``on_llm_end``.

    The result carries a 2 prompt / 1 completion / 3 total token usage and
    the default ``model_name`` declared on ``BaseOpenAI``.
    """
    usage = {
        "prompt_tokens": 2,
        "completion_tokens": 1,
        "total_tokens": 3,
    }
    default_model = BaseOpenAI.__fields__["model_name"].default
    result = LLMResult(
        generations=[],
        llm_output={"token_usage": usage, "model_name": default_model},
    )

    handler.on_llm_end(result)

    # Counters are checked in the same order as before; cost only needs to
    # be positive for this model.
    expected_counters = {
        "successful_requests": 1,
        "total_tokens": 3,
        "prompt_tokens": 2,
        "completion_tokens": 1,
    }
    for attribute, expected in expected_counters.items():
        assert getattr(handler, attribute) == expected
    assert handler.total_cost > 0


def test_on_llm_end_custom_model(handler: OpenAICallbackHandler) -> None:
    """Check that the model name ``foo-bar`` yields a total cost of zero."""
    usage = {
        "prompt_tokens": 2,
        "completion_tokens": 1,
        "total_tokens": 3,
    }
    result = LLMResult(
        generations=[],
        llm_output={"token_usage": usage, "model_name": "foo-bar"},
    )

    handler.on_llm_end(result)

    assert handler.total_cost == 0


@pytest.mark.parametrize(
    ("model_name", "expected_cost"),
    [
        ("ada:ft-your-org:custom-model-name-2022-02-15-04-21-04", 0.0032),
        ("babbage:ft-your-org:custom-model-name-2022-02-15-04-21-04", 0.0048),
        ("curie:ft-your-org:custom-model-name-2022-02-15-04-21-04", 0.024),
        ("davinci:ft-your-org:custom-model-name-2022-02-15-04-21-04", 0.24),
        ("ft:babbage-002:your-org:custom-model-name:1abcdefg", 0.0032),
        ("ft:davinci-002:your-org:custom-model-name:1abcdefg", 0.024),
        ("ft:gpt-3.5-turbo-0613:your-org:custom-model-name:1abcdefg", 0.028),
        ("babbage-002.ft-0123456789abcdefghijklmnopqrstuv", 0.0008),
        ("davinci-002.ft-0123456789abcdefghijklmnopqrstuv", 0.004),
        ("gpt-35-turbo-0613.ft-0123456789abcdefghijklmnopqrstuv", 0.0035),
    ],
)
def test_on_llm_end_finetuned_model(
    handler: OpenAICallbackHandler, model_name: str, expected_cost: float
) -> None:
    """Check the total cost reported for each fine-tuned model name.

    Every case reports 1000 prompt tokens and 1000 completion tokens.

    Args:
        handler: Callback handler under test.
        model_name: Fine-tuned model identifier placed in ``llm_output``.
        expected_cost: Total cost the handler should report for that usage.
    """
    response = LLMResult(
        generations=[],
        llm_output={
            "token_usage": {
                "prompt_tokens": 1000,
                "completion_tokens": 1000,
                "total_tokens": 2000,
            },
            "model_name": model_name,
        },
    )
    handler.on_llm_end(response)
    # The cost is a computed float; compare with a tolerance so the test
    # does not depend on the exact order of the floating-point arithmetic.
    assert handler.total_cost == pytest.approx(expected_cost)


@pytest.mark.parametrize(
    ("model_name", "expected_cost"),
    [
        ("gpt-35-turbo", 0.0035),
        ("gpt-35-turbo-0301", 0.0035),
        ("gpt-35-turbo-0613", 0.0035),
        ("gpt-35-turbo-16k-0613", 0.007),
        ("gpt-35-turbo-16k", 0.007),
        ("gpt-4", 0.09),
        ("gpt-4-0314", 0.09),
        ("gpt-4-0613", 0.09),
        ("gpt-4-32k", 0.18),
        ("gpt-4-32k-0314", 0.18),
        ("gpt-4-32k-0613", 0.18),
    ],
)
def test_on_llm_end_azure_openai(
    handler: OpenAICallbackHandler, model_name: str, expected_cost: float
) -> None:
    """Check the total cost reported for each parametrized model name.

    Every case reports 1000 prompt tokens and 1000 completion tokens.

    Args:
        handler: Callback handler under test.
        model_name: Model identifier placed in ``llm_output``.
        expected_cost: Total cost the handler should report for that usage.
    """
    response = LLMResult(
        generations=[],
        llm_output={
            "token_usage": {
                "prompt_tokens": 1000,
                "completion_tokens": 1000,
                "total_tokens": 2000,
            },
            "model_name": model_name,
        },
    )
    handler.on_llm_end(response)
    # The cost is a computed float; compare with a tolerance so the test
    # does not depend on the exact order of the floating-point arithmetic.
    assert handler.total_cost == pytest.approx(expected_cost)


@pytest.mark.parametrize(
    "model_name",
    [
        "gpt-35-turbo-16k-0301",
        "gpt-4-0301",
        "gpt-4-32k-0301",
    ],
)
def test_on_llm_end_no_cost_invalid_model(
    handler: OpenAICallbackHandler, model_name: str
) -> None:
    """Check that each parametrized model name produces a total cost of zero.

    Every case reports 1000 prompt tokens and 1000 completion tokens.
    """
    usage = {
        "prompt_tokens": 1000,
        "completion_tokens": 1000,
        "total_tokens": 2000,
    }
    result = LLMResult(
        generations=[],
        llm_output={"token_usage": usage, "model_name": model_name},
    )

    handler.on_llm_end(result)

    assert handler.total_cost == 0


def test_on_retry_works(handler: OpenAICallbackHandler) -> None:
    """Smoke test: call ``on_retry`` with a mock argument and a random run id."""
    mock_state = MagicMock()
    run_identifier = uuid4()
    handler.on_retry(mock_state, run_id=run_identifier)
Default On Retry (#9230) Base callbacks don't have a default on retry event Fix #8542 --------- Co-authored-by: landonsilla <landon.silla@stepstone.com> 2023-08-14 23:45:17 +00:00			`from unittest.mock import MagicMock`
			`from uuid import uuid4`

Better custom model handling OpenAICallbackHandler (#4009) Thanks @maykcaldas for flagging! think this should resolve #3988. Let me know if you still see issues after next release. 2023-05-02 23:19:57 +00:00			`import pytest`
REFACTOR: Refactor langchain_core (#13627) Changes: - remove langchain_core/schema since no clear distinction b/n schema and non-schema modules - make every module that doesn't end in -y plural - where easy have 1-2 classes per file - no more than one level of nesting in directories - only import from top level core modules in langchain 2023-11-21 16:35:29 +00:00			`from langchain_core.outputs import LLMResult`
Better custom model handling OpenAICallbackHandler (#4009) Thanks @maykcaldas for flagging! think this should resolve #3988. Let me know if you still see issues after next release. 2023-05-02 23:19:57 +00:00
community[major], core[patch], langchain[patch], experimental[patch]: Create langchain-community (#14463) Moved the following modules to new package langchain-community in a backwards compatible fashion: ``` mv langchain/langchain/adapters community/langchain_community mv langchain/langchain/callbacks community/langchain_community/callbacks mv langchain/langchain/chat_loaders community/langchain_community mv langchain/langchain/chat_models community/langchain_community mv langchain/langchain/document_loaders community/langchain_community mv langchain/langchain/docstore community/langchain_community mv langchain/langchain/document_transformers community/langchain_community mv langchain/langchain/embeddings community/langchain_community mv langchain/langchain/graphs community/langchain_community mv langchain/langchain/llms community/langchain_community mv langchain/langchain/memory/chat_message_histories community/langchain_community mv langchain/langchain/retrievers community/langchain_community mv langchain/langchain/storage community/langchain_community mv langchain/langchain/tools community/langchain_community mv langchain/langchain/utilities community/langchain_community mv langchain/langchain/vectorstores community/langchain_community mv langchain/langchain/agents/agent_toolkits community/langchain_community mv langchain/langchain/cache.py community/langchain_community mv langchain/langchain/adapters community/langchain_community mv langchain/langchain/callbacks community/langchain_community/callbacks mv langchain/langchain/chat_loaders community/langchain_community mv langchain/langchain/chat_models community/langchain_community mv langchain/langchain/document_loaders community/langchain_community mv langchain/langchain/docstore community/langchain_community mv langchain/langchain/document_transformers community/langchain_community mv langchain/langchain/embeddings community/langchain_community mv langchain/langchain/graphs community/langchain_community mv 
langchain/langchain/llms community/langchain_community mv langchain/langchain/memory/chat_message_histories community/langchain_community mv langchain/langchain/retrievers community/langchain_community mv langchain/langchain/storage community/langchain_community mv langchain/langchain/tools community/langchain_community mv langchain/langchain/utilities community/langchain_community mv langchain/langchain/vectorstores community/langchain_community mv langchain/langchain/agents/agent_toolkits community/langchain_community mv langchain/langchain/cache.py community/langchain_community ``` Moved the following to core ``` mv langchain/langchain/utils/json_schema.py core/langchain_core/utils mv langchain/langchain/utils/html.py core/langchain_core/utils mv langchain/langchain/utils/strings.py core/langchain_core/utils cat langchain/langchain/utils/env.py >> core/langchain_core/utils/env.py rm langchain/langchain/utils/env.py ``` See .scripts/community_split/script_integrations.sh for all changes 2023-12-11 21:53:30 +00:00			`from langchain_community.callbacks import OpenAICallbackHandler`
			`from langchain_community.llms.openai import BaseOpenAI`
Better custom model handling OpenAICallbackHandler (#4009) Thanks @maykcaldas for flagging! think this should resolve #3988. Let me know if you still see issues after next release. 2023-05-02 23:19:57 +00:00

			`@pytest.fixture`
			`def handler() -> OpenAICallbackHandler:`
			`return OpenAICallbackHandler()`


			`def test_on_llm_end(handler: OpenAICallbackHandler) -> None:`
			`response = LLMResult(`
			`generations=[],`
			`llm_output={`
			`"token_usage": {`
			`"prompt_tokens": 2,`
			`"completion_tokens": 1,`
			`"total_tokens": 3,`
			`},`
			`"model_name": BaseOpenAI.__fields__["model_name"].default,`
			`},`
			`)`
			`handler.on_llm_end(response)`
			`assert handler.successful_requests == 1`
			`assert handler.total_tokens == 3`
			`assert handler.prompt_tokens == 2`
			`assert handler.completion_tokens == 1`
			`assert handler.total_cost > 0`


			`def test_on_llm_end_custom_model(handler: OpenAICallbackHandler) -> None:`
			`response = LLMResult(`
			`generations=[],`
			`llm_output={`
			`"token_usage": {`
			`"prompt_tokens": 2,`
			`"completion_tokens": 1,`
			`"total_tokens": 3,`
			`},`
			`"model_name": "foo-bar",`
			`},`
			`)`
			`handler.on_llm_end(response)`
			`assert handler.total_cost == 0`
fixing total cost finetuned model giving zero (#5144) # OpenAI finetuned model giving zero tokens cost Very simple fix to the previously committed solution to allowing finetuned OpenAI models. Improves #5127 --------- Co-authored-by: Dev 2049 <dev.dev2049@gmail.com> 2023-05-24 17:04:08 +00:00

Finetuned OpenAI models cost calculation #11715 (#12190) Description: Add cost calculation for fine tuned models (new and legacy), this is required after OpenAI added new models for fine tuning and separated the costs of I/O for fine tuned models. Also I updated the relevant unit tests see https://platform.openai.com/docs/guides/fine-tuning for more information. issue: https://github.com/langchain-ai/langchain/issues/11715 - Issue: 11715 - Twitter handle: @nirkopler 2023-10-24 17:22:05 +00:00			`@pytest.mark.parametrize(`
fix(openai-callback): completion count logic (#12383) The changes introduced in #12267 and #12190 broke the cost computation of the `completion` tokens for fine-tuned models because of the early return. This PR aims at fixing this. @baskaryan. 2023-10-27 16:08:54 +00:00			`"model_name, expected_cost",`
Finetuned OpenAI models cost calculation #11715 (#12190) Description: Add cost calculation for fine tuned models (new and legacy), this is required after OpenAI added new models for fine tuning and separated the costs of I/O for fine tuned models. Also I updated the relevant unit tests see https://platform.openai.com/docs/guides/fine-tuning for more information. issue: https://github.com/langchain-ai/langchain/issues/11715 - Issue: 11715 - Twitter handle: @nirkopler 2023-10-24 17:22:05 +00:00			`[`
fix(openai-callback): completion count logic (#12383) The changes introduced in #12267 and #12190 broke the cost computation of the `completion` tokens for fine-tuned models because of the early return. This PR aims at fixing this. @baskaryan. 2023-10-27 16:08:54 +00:00			`("ada:ft-your-org:custom-model-name-2022-02-15-04-21-04", 0.0032),`
			`("babbage:ft-your-org:custom-model-name-2022-02-15-04-21-04", 0.0048),`
			`("curie:ft-your-org:custom-model-name-2022-02-15-04-21-04", 0.024),`
			`("davinci:ft-your-org:custom-model-name-2022-02-15-04-21-04", 0.24),`
			`("ft:babbage-002:your-org:custom-model-name:1abcdefg", 0.0032),`
			`("ft:davinci-002:your-org:custom-model-name:1abcdefg", 0.024),`
			`("ft:gpt-3.5-turbo-0613:your-org:custom-model-name:1abcdefg", 0.028),`
			`("babbage-002.ft-0123456789abcdefghijklmnopqrstuv", 0.0008),`
			`("davinci-002.ft-0123456789abcdefghijklmnopqrstuv", 0.004),`
			`("gpt-35-turbo-0613.ft-0123456789abcdefghijklmnopqrstuv", 0.0035),`
Finetuned OpenAI models cost calculation #11715 (#12190) Description: Add cost calculation for fine tuned models (new and legacy), this is required after OpenAI added new models for fine tuning and separated the costs of I/O for fine tuned models. Also I updated the relevant unit tests see https://platform.openai.com/docs/guides/fine-tuning for more information. issue: https://github.com/langchain-ai/langchain/issues/11715 - Issue: 11715 - Twitter handle: @nirkopler 2023-10-24 17:22:05 +00:00			`],`
			`)`
			`def test_on_llm_end_finetuned_model(`
fix(openai-callback): completion count logic (#12383) The changes introduced in #12267 and #12190 broke the cost computation of the `completion` tokens for fine-tuned models because of the early return. This PR aims at fixing this. @baskaryan. 2023-10-27 16:08:54 +00:00			`handler: OpenAICallbackHandler, model_name: str, expected_cost: float`
Finetuned OpenAI models cost calculation #11715 (#12190) Description: Add cost calculation for fine tuned models (new and legacy), this is required after OpenAI added new models for fine tuning and separated the costs of I/O for fine tuned models. Also I updated the relevant unit tests see https://platform.openai.com/docs/guides/fine-tuning for more information. issue: https://github.com/langchain-ai/langchain/issues/11715 - Issue: 11715 - Twitter handle: @nirkopler 2023-10-24 17:22:05 +00:00			`) -> None:`
fixing total cost finetuned model giving zero (#5144) # OpenAI finetuned model giving zero tokens cost Very simple fix to the previously committed solution to allowing finetuned OpenAI models. Improves #5127 --------- Co-authored-by: Dev 2049 <dev.dev2049@gmail.com> 2023-05-24 17:04:08 +00:00			`response = LLMResult(`
			`generations=[],`
			`llm_output={`
			`"token_usage": {`
fix(openai-callback): completion count logic (#12383) The changes introduced in #12267 and #12190 broke the cost computation of the `completion` tokens for fine-tuned models because of the early return. This PR aims at fixing this. @baskaryan. 2023-10-27 16:08:54 +00:00			`"prompt_tokens": 1000,`
			`"completion_tokens": 1000,`
			`"total_tokens": 2000,`
fixing total cost finetuned model giving zero (#5144) # OpenAI finetuned model giving zero tokens cost Very simple fix to the previously committed solution to allowing finetuned OpenAI models. Improves #5127 --------- Co-authored-by: Dev 2049 <dev.dev2049@gmail.com> 2023-05-24 17:04:08 +00:00			`},`
Finetuned OpenAI models cost calculation #11715 (#12190) Description: Add cost calculation for fine tuned models (new and legacy), this is required after OpenAI added new models for fine tuning and separated the costs of I/O for fine tuned models. Also I updated the relevant unit tests see https://platform.openai.com/docs/guides/fine-tuning for more information. issue: https://github.com/langchain-ai/langchain/issues/11715 - Issue: 11715 - Twitter handle: @nirkopler 2023-10-24 17:22:05 +00:00			`"model_name": model_name,`
fixing total cost finetuned model giving zero (#5144) # OpenAI finetuned model giving zero tokens cost Very simple fix to the previously committed solution to allowing finetuned OpenAI models. Improves #5127 --------- Co-authored-by: Dev 2049 <dev.dev2049@gmail.com> 2023-05-24 17:04:08 +00:00			`},`
			`)`
			`handler.on_llm_end(response)`
fix(openai-callback): completion count logic (#12383) The changes introduced in #12267 and #12190 broke the cost computation of the `completion` tokens for fine-tuned models because of the early return. This PR aims at fixing this. @baskaryan. 2023-10-27 16:08:54 +00:00			`assert handler.total_cost == expected_cost`
Feature/fix azureopenai model mappings (#8621) This pull request aims to ensure that the `OpenAICallbackHandler` can properly calculate the total cost for Azure OpenAI chat models. The following changes have resolved this issue: - The `model_name` has been added to the ChatResult llm_output. Without this, the default values of `gpt-35-turbo` were applied. This was causing the total cost for Azure OpenAI's GPT-4 to be significantly inaccurate. - A new parameter `model_version` has been added to `AzureChatOpenAI`. Azure does not include the model version in the response. With the addition of `model_name`, this is not a significant issue for GPT-4 models, but it's an issue for GPT-3.5-Turbo. Version 0301 (default) of GPT-3.5-Turbo on Azure has a flat rate of 0.002 per 1k tokens for both prompt and completion. However, version 0613 introduced a split in pricing for prompt and completion tokens. - The `OpenAICallbackHandler` implementation has been updated with the proper model names, versions, and cost per 1k tokens. Unit tests have been added to ensure the functionality works as expected; the Azure ChatOpenAI notebook has been updated with examples. Maintainers: @hwchase17, @baskaryan Twitter handle: @jjczopek --------- Co-authored-by: Jerzy Czopek <jerzy.czopek@avanade.com> Co-authored-by: Bagatur <baskaryan@gmail.com> 2023-08-09 17:56:15 +00:00

			`@pytest.mark.parametrize(`
			`"model_name,expected_cost",`
			`[`
			`("gpt-35-turbo", 0.0035),`
			`("gpt-35-turbo-0301", 0.0035),`
			`(`
			`"gpt-35-turbo-0613",`
			`0.0035,`
			`),`
			`(`
			`"gpt-35-turbo-16k-0613",`
			`0.007,`
			`),`
			`(`
			`"gpt-35-turbo-16k",`
			`0.007,`
			`),`
			`("gpt-4", 0.09),`
			`("gpt-4-0314", 0.09),`
			`("gpt-4-0613", 0.09),`
			`("gpt-4-32k", 0.18),`
			`("gpt-4-32k-0314", 0.18),`
			`("gpt-4-32k-0613", 0.18),`
			`],`
			`)`
			`def test_on_llm_end_azure_openai(`
			`handler: OpenAICallbackHandler, model_name: str, expected_cost: float`
			`) -> None:`
			`response = LLMResult(`
			`generations=[],`
			`llm_output={`
			`"token_usage": {`
			`"prompt_tokens": 1000,`
			`"completion_tokens": 1000,`
			`"total_tokens": 2000,`
			`},`
			`"model_name": model_name,`
			`},`
			`)`
			`handler.on_llm_end(response)`
			`assert handler.total_cost == expected_cost`


			`@pytest.mark.parametrize(`
			`"model_name", ["gpt-35-turbo-16k-0301", "gpt-4-0301", "gpt-4-32k-0301"]`
			`)`
			`def test_on_llm_end_no_cost_invalid_model(`
			`handler: OpenAICallbackHandler, model_name: str`
			`) -> None:`
			`response = LLMResult(`
			`generations=[],`
			`llm_output={`
			`"token_usage": {`
			`"prompt_tokens": 1000,`
			`"completion_tokens": 1000,`
			`"total_tokens": 2000,`
			`},`
			`"model_name": model_name,`
			`},`
			`)`
			`handler.on_llm_end(response)`
			`assert handler.total_cost == 0`
Default On Retry (#9230) Base callbacks don't have a default on retry event Fix #8542 --------- Co-authored-by: landonsilla <landon.silla@stepstone.com> 2023-08-14 23:45:17 +00:00

			`def test_on_retry_works(handler: OpenAICallbackHandler) -> None:`
			`handler.on_retry(MagicMock(), run_id=uuid4())`