langchain/libs/partners/anthropic/tests/unit_tests/test_chat_models.py

"""Test chat model integration."""

import os
from typing import Any, Callable, Dict, Literal, Type, cast

import pytest
from anthropic.types import ContentBlock, Message, Usage
from langchain_core.messages import AIMessage, HumanMessage, SystemMessage, ToolMessage
from langchain_core.outputs import ChatGeneration, ChatResult
from langchain_core.pydantic_v1 import BaseModel, Field, SecretStr
from langchain_core.tools import BaseTool

from langchain_anthropic import ChatAnthropic
from langchain_anthropic.chat_models import (
    _format_messages,
    _merge_messages,
    convert_to_anthropic_tool,
)

os.environ["ANTHROPIC_API_KEY"] = "foo"


def test_initialization() -> None:
    """Test chat model initialization."""
    for model in [
        ChatAnthropic(model_name="claude-instant-1.2", api_key="xyz", timeout=2),
        ChatAnthropic(
            model="claude-instant-1.2",
            anthropic_api_key="xyz",
            default_request_timeout=2,
        ),
    ]:
        assert model.model == "claude-instant-1.2"
        assert cast(SecretStr, model.anthropic_api_key).get_secret_value() == "xyz"
        assert model.default_request_timeout == 2.0


@pytest.mark.requires("anthropic")
def test_anthropic_model_name_param() -> None:
    llm = ChatAnthropic(model_name="foo")
    assert llm.model == "foo"


@pytest.mark.requires("anthropic")
def test_anthropic_model_param() -> None:
    llm = ChatAnthropic(model="foo")
    assert llm.model == "foo"


@pytest.mark.requires("anthropic")
def test_anthropic_model_kwargs() -> None:
    llm = ChatAnthropic(model_name="foo", model_kwargs={"foo": "bar"})
    assert llm.model_kwargs == {"foo": "bar"}


@pytest.mark.requires("anthropic")
def test_anthropic_invalid_model_kwargs() -> None:
    with pytest.raises(ValueError):
        ChatAnthropic(model="foo", model_kwargs={"max_tokens_to_sample": 5})


@pytest.mark.requires("anthropic")
def test_anthropic_incorrect_field() -> None:
    with pytest.warns(match="not default parameter"):
        llm = ChatAnthropic(model="foo", foo="bar")
    assert llm.model_kwargs == {"foo": "bar"}


@pytest.mark.requires("anthropic")
def test_anthropic_initialization() -> None:
    """Test anthropic initialization."""
    # Verify that chat anthropic can be initialized using a secret key provided
    # as a parameter rather than an environment variable.
    ChatAnthropic(model="test", anthropic_api_key="test")


def test__format_output() -> None:
    anthropic_msg = Message(
        id="foo",
        content=[ContentBlock(type="text", text="bar")],
        model="baz",
        role="assistant",
        stop_reason=None,
        stop_sequence=None,
        usage=Usage(input_tokens=2, output_tokens=1),
        type="message",
    )
    expected = ChatResult(
        generations=[
            ChatGeneration(message=AIMessage("bar")),
        ],
        llm_output={
            "id": "foo",
            "model": "baz",
            "stop_reason": None,
            "stop_sequence": None,
            "usage": {"input_tokens": 2, "output_tokens": 1},
        },
    )
    llm = ChatAnthropic(model="test", anthropic_api_key="test")
    actual = llm._format_output(anthropic_msg)
    assert expected == actual


def test__merge_messages() -> None:
    messages = [
        SystemMessage("foo"),
        HumanMessage("bar"),
        AIMessage(
            [
                {"text": "baz", "type": "text"},
                {
                    "tool_input": {"a": "b"},
                    "type": "tool_use",
                    "id": "1",
                    "text": None,
                    "name": "buz",
                },
                {"text": "baz", "type": "text"},
                {
                    "tool_input": {"a": "c"},
                    "type": "tool_use",
                    "id": "2",
                    "text": None,
                    "name": "blah",
                },
            ]
        ),
        ToolMessage("buz output", tool_call_id="1"),
        ToolMessage("blah output", tool_call_id="2"),
        HumanMessage("next thing"),
    ]
    expected = [
        SystemMessage("foo"),
        HumanMessage("bar"),
        AIMessage(
            [
                {"text": "baz", "type": "text"},
                {
                    "tool_input": {"a": "b"},
                    "type": "tool_use",
                    "id": "1",
                    "text": None,
                    "name": "buz",
                },
                {"text": "baz", "type": "text"},
                {
                    "tool_input": {"a": "c"},
                    "type": "tool_use",
                    "id": "2",
                    "text": None,
                    "name": "blah",
                },
            ]
        ),
        HumanMessage(
            [
                {"type": "tool_result", "content": "buz output", "tool_use_id": "1"},
                {"type": "tool_result", "content": "blah output", "tool_use_id": "2"},
                {"type": "text", "text": "next thing"},
            ]
        ),
    ]
    actual = _merge_messages(messages)
    assert expected == actual


def test__merge_messages_mutation() -> None:
    original_messages = [
        HumanMessage([{"type": "text", "text": "bar"}]),
        HumanMessage("next thing"),
    ]
    messages = [
        HumanMessage([{"type": "text", "text": "bar"}]),
        HumanMessage("next thing"),
    ]
    expected = [
        HumanMessage(
            [{"type": "text", "text": "bar"}, {"type": "text", "text": "next thing"}]
        ),
    ]
    actual = _merge_messages(messages)
    assert expected == actual
    assert messages == original_messages


@pytest.fixture()
def pydantic() -> Type[BaseModel]:
    class dummy_function(BaseModel):
        """dummy function"""

        arg1: int = Field(..., description="foo")
        arg2: Literal["bar", "baz"] = Field(..., description="one of 'bar', 'baz'")

    return dummy_function


@pytest.fixture()
def function() -> Callable:
    def dummy_function(arg1: int, arg2: Literal["bar", "baz"]) -> None:
        """dummy function

        Args:
            arg1: foo
            arg2: one of 'bar', 'baz'
        """
        pass

    return dummy_function


@pytest.fixture()
def dummy_tool() -> BaseTool:
    class Schema(BaseModel):
        arg1: int = Field(..., description="foo")
        arg2: Literal["bar", "baz"] = Field(..., description="one of 'bar', 'baz'")

    class DummyFunction(BaseTool):
        args_schema: Type[BaseModel] = Schema
        name: str = "dummy_function"
        description: str = "dummy function"

        def _run(self, *args: Any, **kwargs: Any) -> Any:
            pass

    return DummyFunction()


@pytest.fixture()
def json_schema() -> Dict:
    return {
        "title": "dummy_function",
        "description": "dummy function",
        "type": "object",
        "properties": {
            "arg1": {"description": "foo", "type": "integer"},
            "arg2": {
                "description": "one of 'bar', 'baz'",
                "enum": ["bar", "baz"],
                "type": "string",
            },
        },
        "required": ["arg1", "arg2"],
    }


@pytest.fixture()
def openai_function() -> Dict:
    return {
        "name": "dummy_function",
        "description": "dummy function",
        "parameters": {
            "type": "object",
            "properties": {
                "arg1": {"description": "foo", "type": "integer"},
                "arg2": {
                    "description": "one of 'bar', 'baz'",
                    "enum": ["bar", "baz"],
                    "type": "string",
                },
            },
            "required": ["arg1", "arg2"],
        },
    }


def test_convert_to_anthropic_tool(
    pydantic: Type[BaseModel],
    function: Callable,
    dummy_tool: BaseTool,
    json_schema: Dict,
    openai_function: Dict,
) -> None:
    expected = {
        "name": "dummy_function",
        "description": "dummy function",
        "input_schema": {
            "type": "object",
            "properties": {
                "arg1": {"description": "foo", "type": "integer"},
                "arg2": {
                    "description": "one of 'bar', 'baz'",
                    "enum": ["bar", "baz"],
                    "type": "string",
                },
            },
            "required": ["arg1", "arg2"],
        },
    }

    for fn in (pydantic, function, dummy_tool, json_schema, expected, openai_function):
        actual = convert_to_anthropic_tool(fn)  # type: ignore
        assert actual == expected


def test__format_messages_with_tool_calls() -> None:
    system = SystemMessage("fuzz")
    human = HumanMessage("foo")
    ai = AIMessage(
        "",
        tool_calls=[{"name": "bar", "id": "1", "args": {"baz": "buzz"}}],
    )
    tool = ToolMessage(
        "blurb",
        tool_call_id="1",
    )
    messages = [system, human, ai, tool]
    expected = (
        "fuzz",
        [
            {"role": "user", "content": "foo"},
            {
                "role": "assistant",
                "content": [
                    {
                        "type": "tool_use",
                        "name": "bar",
                        "id": "1",
                        "input": {"baz": "buzz"},
                    }
                ],
            },
            {
                "role": "user",
                "content": [
                    {"type": "tool_result", "content": "blurb", "tool_use_id": "1"}
                ],
            },
        ],
    )
    actual = _format_messages(messages)
    assert expected == actual


def test__format_messages_with_str_content_and_tool_calls() -> None:
    system = SystemMessage("fuzz")
    human = HumanMessage("foo")
    # If content and tool_calls are specified and content is a string, then both are
    # included with content first.
    ai = AIMessage(
        "thought",
        tool_calls=[{"name": "bar", "id": "1", "args": {"baz": "buzz"}}],
    )
    tool = ToolMessage(
        "blurb",
        tool_call_id="1",
    )
    messages = [system, human, ai, tool]
    expected = (
        "fuzz",
        [
            {"role": "user", "content": "foo"},
            {
                "role": "assistant",
                "content": [
                    {
                        "type": "text",
                        "text": "thought",
                    },
                    {
                        "type": "tool_use",
                        "name": "bar",
                        "id": "1",
                        "input": {"baz": "buzz"},
                    },
                ],
            },
            {
                "role": "user",
                "content": [
                    {"type": "tool_result", "content": "blurb", "tool_use_id": "1"}
                ],
            },
        ],
    )
    actual = _format_messages(messages)
    assert expected == actual


def test__format_messages_with_list_content_and_tool_calls() -> None:
    system = SystemMessage("fuzz")
    human = HumanMessage("foo")
    # If content and tool_calls are specified and content is a list, then content is
    # preferred.
    ai = AIMessage(
        [
            {
                "type": "text",
                "text": "thought",
            }
        ],
        tool_calls=[{"name": "bar", "id": "1", "args": {"baz": "buzz"}}],
    )
    tool = ToolMessage(
        "blurb",
        tool_call_id="1",
    )
    messages = [system, human, ai, tool]
    expected = (
        "fuzz",
        [
            {"role": "user", "content": "foo"},
            {
                "role": "assistant",
                "content": [
                    {
                        "type": "text",
                        "text": "thought",
                    }
                ],
            },
            {
                "role": "user",
                "content": [
                    {"type": "tool_result", "content": "blurb", "tool_use_id": "1"}
                ],
            },
        ],
    )
    actual = _format_messages(messages)
    assert expected == actual
anthropic: beta messages integration (#14928) 2023-12-20 02:55:19 +00:00			`"""Test chat model integration."""`

anthropic[minor]: package move (#17974) 2024-02-26 05:57:26 +00:00			`import os`
anthropic[patch]: standardize init args (#20161) Related to #20085 2024-04-08 17:09:06 +00:00			`from typing import Any, Callable, Dict, Literal, Type, cast`
anthropic: beta messages integration (#14928) 2023-12-20 02:55:19 +00:00
anthropic[minor]: package move (#17974) 2024-02-26 05:57:26 +00:00			`import pytest`
anthropic[patch]: fix response metadata type (#19683) 2024-03-28 06:16:26 +00:00			`from anthropic.types import ContentBlock, Message, Usage`
anthropic[minor]: tool use (#20016) 2024-04-04 20:22:48 +00:00			`from langchain_core.messages import AIMessage, HumanMessage, SystemMessage, ToolMessage`
anthropic[patch]: fix response metadata type (#19683) 2024-03-28 06:16:26 +00:00			`from langchain_core.outputs import ChatGeneration, ChatResult`
anthropic[patch]: standardize init args (#20161) Related to #20085 2024-04-08 17:09:06 +00:00			`from langchain_core.pydantic_v1 import BaseModel, Field, SecretStr`
anthropic[minor]: tool use (#20016) 2024-04-04 20:22:48 +00:00			`from langchain_core.tools import BaseTool`
anthropic[minor]: package move (#17974) 2024-02-26 05:57:26 +00:00
anthropic[patch]: standardize init args (#20161) Related to #20085 2024-04-08 17:09:06 +00:00			`from langchain_anthropic import ChatAnthropic`
anthropic[patch]: release 0.1.9, use tool calls if content is empty (#20535) 2024-04-16 22:27:29 +00:00			`from langchain_anthropic.chat_models import (`
			`_format_messages,`
			`_merge_messages,`
			`convert_to_anthropic_tool,`
			`)`
anthropic[minor]: package move (#17974) 2024-02-26 05:57:26 +00:00
			`os.environ["ANTHROPIC_API_KEY"] = "foo"`
anthropic: beta messages integration (#14928) 2023-12-20 02:55:19 +00:00

			`def test_initialization() -> None:`
			`"""Test chat model initialization."""`
anthropic[patch]: standardize init args (#20161) Related to #20085 2024-04-08 17:09:06 +00:00			`for model in [`
			`ChatAnthropic(model_name="claude-instant-1.2", api_key="xyz", timeout=2),`
			`ChatAnthropic(`
			`model="claude-instant-1.2",`
			`anthropic_api_key="xyz",`
			`default_request_timeout=2,`
			`),`
			`]:`
			`assert model.model == "claude-instant-1.2"`
			`assert cast(SecretStr, model.anthropic_api_key).get_secret_value() == "xyz"`
			`assert model.default_request_timeout == 2.0`
anthropic[minor]: package move (#17974) 2024-02-26 05:57:26 +00:00

			`@pytest.mark.requires("anthropic")`
			`def test_anthropic_model_name_param() -> None:`
			`llm = ChatAnthropic(model_name="foo")`
			`assert llm.model == "foo"`


			`@pytest.mark.requires("anthropic")`
			`def test_anthropic_model_param() -> None:`
			`llm = ChatAnthropic(model="foo")`
			`assert llm.model == "foo"`


			`@pytest.mark.requires("anthropic")`
			`def test_anthropic_model_kwargs() -> None:`
			`llm = ChatAnthropic(model_name="foo", model_kwargs={"foo": "bar"})`
			`assert llm.model_kwargs == {"foo": "bar"}`


			`@pytest.mark.requires("anthropic")`
			`def test_anthropic_invalid_model_kwargs() -> None:`
			`with pytest.raises(ValueError):`
			`ChatAnthropic(model="foo", model_kwargs={"max_tokens_to_sample": 5})`


			`@pytest.mark.requires("anthropic")`
			`def test_anthropic_incorrect_field() -> None:`
			`with pytest.warns(match="not default parameter"):`
			`llm = ChatAnthropic(model="foo", foo="bar")`
			`assert llm.model_kwargs == {"foo": "bar"}`


			`@pytest.mark.requires("anthropic")`
			`def test_anthropic_initialization() -> None:`
			`"""Test anthropic initialization."""`
			`# Verify that chat anthropic can be initialized using a secret key provided`
			`# as a parameter rather than an environment variable.`
			`ChatAnthropic(model="test", anthropic_api_key="test")`
anthropic[patch]: fix response metadata type (#19683) 2024-03-28 06:16:26 +00:00

			`def test__format_output() -> None:`
			`anthropic_msg = Message(`
			`id="foo",`
			`content=[ContentBlock(type="text", text="bar")],`
			`model="baz",`
			`role="assistant",`
			`stop_reason=None,`
			`stop_sequence=None,`
			`usage=Usage(input_tokens=2, output_tokens=1),`
			`type="message",`
			`)`
			`expected = ChatResult(`
			`generations=[`
			`ChatGeneration(message=AIMessage("bar")),`
			`],`
			`llm_output={`
			`"id": "foo",`
			`"model": "baz",`
			`"stop_reason": None,`
			`"stop_sequence": None,`
			`"usage": {"input_tokens": 2, "output_tokens": 1},`
			`},`
			`)`
			`llm = ChatAnthropic(model="test", anthropic_api_key="test")`
			`actual = llm._format_output(anthropic_msg)`
			`assert expected == actual`
anthropic[minor]: tool use (#20016) 2024-04-04 20:22:48 +00:00

			`def test__merge_messages() -> None:`
			`messages = [`
			`SystemMessage("foo"),`
			`HumanMessage("bar"),`
			`AIMessage(`
			`[`
			`{"text": "baz", "type": "text"},`
			`{`
			`"tool_input": {"a": "b"},`
			`"type": "tool_use",`
			`"id": "1",`
			`"text": None,`
			`"name": "buz",`
			`},`
			`{"text": "baz", "type": "text"},`
			`{`
			`"tool_input": {"a": "c"},`
			`"type": "tool_use",`
			`"id": "2",`
			`"text": None,`
			`"name": "blah",`
			`},`
			`]`
			`),`
			`ToolMessage("buz output", tool_call_id="1"),`
			`ToolMessage("blah output", tool_call_id="2"),`
			`HumanMessage("next thing"),`
			`]`
			`expected = [`
			`SystemMessage("foo"),`
			`HumanMessage("bar"),`
			`AIMessage(`
			`[`
			`{"text": "baz", "type": "text"},`
			`{`
			`"tool_input": {"a": "b"},`
			`"type": "tool_use",`
			`"id": "1",`
			`"text": None,`
			`"name": "buz",`
			`},`
			`{"text": "baz", "type": "text"},`
			`{`
			`"tool_input": {"a": "c"},`
			`"type": "tool_use",`
			`"id": "2",`
			`"text": None,`
			`"name": "blah",`
			`},`
			`]`
			`),`
			`HumanMessage(`
			`[`
			`{"type": "tool_result", "content": "buz output", "tool_use_id": "1"},`
			`{"type": "tool_result", "content": "blah output", "tool_use_id": "2"},`
			`{"type": "text", "text": "next thing"},`
			`]`
			`),`
			`]`
			`actual = _merge_messages(messages)`
			`assert expected == actual`


anthropic[patch]: fix msg mutation (#20572) 2024-04-17 22:47:19 +00:00			`def test__merge_messages_mutation() -> None:`
			`original_messages = [`
			`HumanMessage([{"type": "text", "text": "bar"}]),`
			`HumanMessage("next thing"),`
			`]`
			`messages = [`
			`HumanMessage([{"type": "text", "text": "bar"}]),`
			`HumanMessage("next thing"),`
			`]`
			`expected = [`
			`HumanMessage(`
			`[{"type": "text", "text": "bar"}, {"type": "text", "text": "next thing"}]`
			`),`
			`]`
			`actual = _merge_messages(messages)`
			`assert expected == actual`
			`assert messages == original_messages`


anthropic[minor]: tool use (#20016) 2024-04-04 20:22:48 +00:00			`@pytest.fixture()`
			`def pydantic() -> Type[BaseModel]:`
			`class dummy_function(BaseModel):`
			`"""dummy function"""`

			`arg1: int = Field(..., description="foo")`
			`arg2: Literal["bar", "baz"] = Field(..., description="one of 'bar', 'baz'")`

			`return dummy_function`


			`@pytest.fixture()`
			`def function() -> Callable:`
			`def dummy_function(arg1: int, arg2: Literal["bar", "baz"]) -> None:`
			`"""dummy function`

			`Args:`
			`arg1: foo`
			`arg2: one of 'bar', 'baz'`
			`"""`
			`pass`

			`return dummy_function`


			`@pytest.fixture()`
			`def dummy_tool() -> BaseTool:`
			`class Schema(BaseModel):`
			`arg1: int = Field(..., description="foo")`
			`arg2: Literal["bar", "baz"] = Field(..., description="one of 'bar', 'baz'")`

			`class DummyFunction(BaseTool):`
			`args_schema: Type[BaseModel] = Schema`
			`name: str = "dummy_function"`
			`description: str = "dummy function"`

			`def _run(self, args: Any, *kwargs: Any) -> Any:`
			`pass`

			`return DummyFunction()`


			`@pytest.fixture()`
			`def json_schema() -> Dict:`
			`return {`
			`"title": "dummy_function",`
			`"description": "dummy function",`
			`"type": "object",`
			`"properties": {`
			`"arg1": {"description": "foo", "type": "integer"},`
			`"arg2": {`
			`"description": "one of 'bar', 'baz'",`
			`"enum": ["bar", "baz"],`
			`"type": "string",`
			`},`
			`},`
			`"required": ["arg1", "arg2"],`
			`}`


			`@pytest.fixture()`
			`def openai_function() -> Dict:`
			`return {`
			`"name": "dummy_function",`
			`"description": "dummy function",`
			`"parameters": {`
			`"type": "object",`
			`"properties": {`
			`"arg1": {"description": "foo", "type": "integer"},`
			`"arg2": {`
			`"description": "one of 'bar', 'baz'",`
			`"enum": ["bar", "baz"],`
			`"type": "string",`
			`},`
			`},`
			`"required": ["arg1", "arg2"],`
			`},`
			`}`


			`def test_convert_to_anthropic_tool(`
			`pydantic: Type[BaseModel],`
			`function: Callable,`
			`dummy_tool: BaseTool,`
			`json_schema: Dict,`
			`openai_function: Dict,`
			`) -> None:`
			`expected = {`
			`"name": "dummy_function",`
			`"description": "dummy function",`
			`"input_schema": {`
			`"type": "object",`
			`"properties": {`
			`"arg1": {"description": "foo", "type": "integer"},`
			`"arg2": {`
			`"description": "one of 'bar', 'baz'",`
			`"enum": ["bar", "baz"],`
			`"type": "string",`
			`},`
			`},`
			`"required": ["arg1", "arg2"],`
			`},`
			`}`

			`for fn in (pydantic, function, dummy_tool, json_schema, expected, openai_function):`
			`actual = convert_to_anthropic_tool(fn) # type: ignore`
			`assert actual == expected`
anthropic[patch]: release 0.1.9, use tool calls if content is empty (#20535) 2024-04-16 22:27:29 +00:00

			`def test__format_messages_with_tool_calls() -> None:`
			`system = SystemMessage("fuzz")`
			`human = HumanMessage("foo")`
			`ai = AIMessage(`
			`"",`
			`tool_calls=[{"name": "bar", "id": "1", "args": {"baz": "buzz"}}],`
			`)`
			`tool = ToolMessage(`
			`"blurb",`
			`tool_call_id="1",`
			`)`
			`messages = [system, human, ai, tool]`
			`expected = (`
			`"fuzz",`
			`[`
			`{"role": "user", "content": "foo"},`
			`{`
			`"role": "assistant",`
			`"content": [`
			`{`
			`"type": "tool_use",`
			`"name": "bar",`
			`"id": "1",`
			`"input": {"baz": "buzz"},`
			`}`
			`],`
			`},`
			`{`
			`"role": "user",`
			`"content": [`
			`{"type": "tool_result", "content": "blurb", "tool_use_id": "1"}`
			`],`
			`},`
			`],`
			`)`
			`actual = _format_messages(messages)`
			`assert expected == actual`


			`def test__format_messages_with_str_content_and_tool_calls() -> None:`
			`system = SystemMessage("fuzz")`
			`human = HumanMessage("foo")`
			`# If content and tool_calls are specified and content is a string, then both are`
			`# included with content first.`
			`ai = AIMessage(`
			`"thought",`
			`tool_calls=[{"name": "bar", "id": "1", "args": {"baz": "buzz"}}],`
			`)`
			`tool = ToolMessage(`
			`"blurb",`
			`tool_call_id="1",`
			`)`
			`messages = [system, human, ai, tool]`
			`expected = (`
			`"fuzz",`
			`[`
			`{"role": "user", "content": "foo"},`
			`{`
			`"role": "assistant",`
			`"content": [`
			`{`
			`"type": "text",`
			`"text": "thought",`
			`},`
			`{`
			`"type": "tool_use",`
			`"name": "bar",`
			`"id": "1",`
			`"input": {"baz": "buzz"},`
			`},`
			`],`
			`},`
			`{`
			`"role": "user",`
			`"content": [`
			`{"type": "tool_result", "content": "blurb", "tool_use_id": "1"}`
			`],`
			`},`
			`],`
			`)`
			`actual = _format_messages(messages)`
			`assert expected == actual`


			`def test__format_messages_with_list_content_and_tool_calls() -> None:`
			`system = SystemMessage("fuzz")`
			`human = HumanMessage("foo")`
			`# If content and tool_calls are specified and content is a list, then content is`
			`# preferred.`
			`ai = AIMessage(`
			`[`
			`{`
			`"type": "text",`
			`"text": "thought",`
			`}`
			`],`
			`tool_calls=[{"name": "bar", "id": "1", "args": {"baz": "buzz"}}],`
			`)`
			`tool = ToolMessage(`
			`"blurb",`
			`tool_call_id="1",`
			`)`
			`messages = [system, human, ai, tool]`
			`expected = (`
			`"fuzz",`
			`[`
			`{"role": "user", "content": "foo"},`
			`{`
			`"role": "assistant",`
			`"content": [`
			`{`
			`"type": "text",`
			`"text": "thought",`
			`}`
			`],`
			`},`
			`{`
			`"role": "user",`
			`"content": [`
			`{"type": "tool_result", "content": "blurb", "tool_use_id": "1"}`
			`],`
			`},`
			`],`
			`)`
			`actual = _format_messages(messages)`
			`assert expected == actual`