mirror of https://github.com/hwchase17/langchain
Add LCP Client (#4198)
Adding a client to fetch datasets, examples, and runs from an LCP instance and run chains and language models over them.
pull/4204/head
parent
a30f42da4e
commit
1017e5cee2
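For orientation before the diff: a minimal usage sketch of the new client, assuming a local LCP instance at http://localhost:8000, a placeholder tenant ID, and stand-in names ("examples.csv" with `question`/`answer` columns, and `my_chain`) that are not part of this commit.

# Minimal usage sketch (not part of the commit); names below are placeholders.
from langchain.client import LangChainPlusClient

client = LangChainPlusClient(
    api_url="http://localhost:8000",  # local instance, so no API key is required
    tenant_id="00000000-0000-0000-0000-000000000000",  # placeholder tenant ID
)

# Upload a CSV whose columns are split into example inputs and reference outputs.
dataset = client.upload_csv(
    "examples.csv",  # stand-in path; a (name, BytesIO) tuple also works
    description="Toy QA dataset",
    input_keys=["question"],
    output_keys=["answer"],
)

# Run a chain (or language model) over every example, tracing into a named session.
results = client.run_on_dataset(
    dataset_name=dataset.name,
    llm_or_chain=my_chain,  # any Chain or language model; not defined in this commit
    num_repetitions=1,
    session_name="my-first-eval",
    verbose=True,
)
# `results` maps each example ID to the model outputs for that example.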
@@ -0,0 +1,6 @@
"""LangChain+ Client."""

from langchain.client.langchain import LangChainPlusClient

__all__ = ["LangChainPlusClient"]

@@ -0,0 +1,544 @@
from __future__ import annotations

import asyncio
import functools
import logging
import socket
from datetime import datetime
from io import BytesIO
from typing import (
    TYPE_CHECKING,
    Any,
    Callable,
    Coroutine,
    Dict,
    Iterable,
    List,
    Optional,
    Tuple,
    Union,
)
from urllib.parse import urlsplit
from uuid import UUID

import requests
from pydantic import BaseSettings, Field, root_validator
from requests import Response

from langchain.base_language import BaseLanguageModel
from langchain.callbacks.manager import tracing_v2_enabled
from langchain.callbacks.tracers.langchain import LangChainTracerV2
from langchain.chains.base import Chain
from langchain.chat_models.base import BaseChatModel
from langchain.client.models import Dataset, DatasetCreate, Example, ExampleCreate
from langchain.client.utils import parse_chat_messages
from langchain.llms.base import BaseLLM
from langchain.schema import ChatResult, LLMResult
from langchain.utils import raise_for_status_with_text, xor_args

if TYPE_CHECKING:
    import pandas as pd

logger = logging.getLogger(__name__)


def _get_link_stem(url: str) -> str:
    scheme = urlsplit(url).scheme
    netloc_prefix = urlsplit(url).netloc.split(":")[0]
    return f"{scheme}://{netloc_prefix}"


def _is_localhost(url: str) -> bool:
    """Check if the URL is localhost."""
    try:
        netloc = urlsplit(url).netloc.split(":")[0]
        ip = socket.gethostbyname(netloc)
        return ip == "127.0.0.1" or ip.startswith("0.0.0.0") or ip.startswith("::")
    except socket.gaierror:
        return False


class LangChainPlusClient(BaseSettings):
    """Client for interacting with the LangChain+ API."""

    api_key: Optional[str] = Field(default=None, env="LANGCHAIN_API_KEY")
    api_url: str = Field(..., env="LANGCHAIN_ENDPOINT")
    tenant_id: str = Field(..., env="LANGCHAIN_TENANT_ID")

    @root_validator(pre=True)
    def validate_api_key_if_hosted(cls, values: Dict[str, Any]) -> Dict[str, Any]:
        """Verify an API key is provided if the URL is not localhost."""
        api_url: str = values.get("api_url", "http://localhost:8000")
        api_key: Optional[str] = values.get("api_key")
        if not _is_localhost(api_url):
            if not api_key:
                raise ValueError(
                    "API key must be provided when using hosted LangChain+ API"
                )
        else:
            tenant_id = values.get("tenant_id")
            if not tenant_id:
                values["tenant_id"] = LangChainPlusClient._get_seeded_tenant_id(
                    api_url, api_key
                )
        return values

    @staticmethod
    def _get_seeded_tenant_id(api_url: str, api_key: Optional[str]) -> str:
        """Get the tenant ID from the seeded tenant."""
        url = f"{api_url}/tenants"
        headers = {"authorization": f"Bearer {api_key}"} if api_key else {}
        response = requests.get(url, headers=headers)
        try:
            raise_for_status_with_text(response)
        except Exception as e:
            raise ValueError(
                "Unable to get seeded tenant ID. Please provide a tenant ID manually."
            ) from e
        results: List[dict] = response.json()
        if len(results) == 0:
            raise ValueError("No seeded tenant found")
        return results[0]["id"]

    def _repr_html_(self) -> str:
        """Return an HTML representation of the instance with a link to the URL."""
        link = _get_link_stem(self.api_url)
        return f'<a href="{link}" target="_blank" rel="noopener">LangChain+ Client</a>'

    def __repr__(self) -> str:
        """Return a string representation of the instance with a link to the URL."""
        return f"LangChainPlusClient (API URL: {self.api_url})"

    @property
    def _headers(self) -> Dict[str, str]:
        """Get the headers for the API request."""
        headers = {}
        if self.api_key:
            headers["authorization"] = f"Bearer {self.api_key}"
        return headers

    @property
    def query_params(self) -> Dict[str, str]:
        """Get the query params for the API request."""
        return {"tenant_id": self.tenant_id}

    def _get(self, path: str, params: Optional[Dict[str, Any]] = None) -> Response:
        """Make a GET request."""
        query_params = self.query_params
        if params:
            query_params.update(params)
        return requests.get(
            f"{self.api_url}{path}", headers=self._headers, params=query_params
        )

    def upload_dataframe(
        self,
        df: pd.DataFrame,
        name: str,
        description: str,
        input_keys: List[str],
        output_keys: List[str],
    ) -> Dataset:
        """Upload a dataframe as individual examples to the LangChain+ API."""
        dataset = self.create_dataset(dataset_name=name, description=description)
        for row in df.itertuples():
            inputs = {key: getattr(row, key) for key in input_keys}
            outputs = {key: getattr(row, key) for key in output_keys}
            self.create_example(inputs, outputs=outputs, dataset_id=dataset.id)
        return dataset

    def upload_csv(
        self,
        csv_file: Union[str, Tuple[str, BytesIO]],
        description: str,
        input_keys: List[str],
        output_keys: List[str],
    ) -> Dataset:
        """Upload a CSV file to the LangChain+ API."""
        files = {"file": csv_file}
        data = {
            "input_keys": ",".join(input_keys),
            "output_keys": ",".join(output_keys),
            "description": description,
            "tenant_id": self.tenant_id,
        }
        response = requests.post(
            self.api_url + "/datasets/upload",
            headers=self._headers,
            data=data,
            files=files,
        )
        raise_for_status_with_text(response)
        result = response.json()
        # TODO: Make this more robust server-side
        if "detail" in result and "already exists" in result["detail"]:
            file_name = csv_file if isinstance(csv_file, str) else csv_file[0]
            file_name = file_name.split("/")[-1]
            raise ValueError(f"Dataset {file_name} already exists")
        return Dataset(**result)

    def create_dataset(self, dataset_name: str, description: str) -> Dataset:
        """Create a dataset in the LangChain+ API."""
        dataset = DatasetCreate(
            tenant_id=self.tenant_id,
            name=dataset_name,
            description=description,
        )
        response = requests.post(
            self.api_url + "/datasets",
            headers=self._headers,
            data=dataset.json(),
        )
        raise_for_status_with_text(response)
        return Dataset(**response.json())

    @xor_args(("dataset_name", "dataset_id"))
    def read_dataset(
        self, *, dataset_name: Optional[str] = None, dataset_id: Optional[str] = None
    ) -> Dataset:
        path = "/datasets"
        params: Dict[str, Any] = {"limit": 1, "tenant_id": self.tenant_id}
        if dataset_id is not None:
            path += f"/{dataset_id}"
        elif dataset_name is not None:
            params["name"] = dataset_name
        else:
            raise ValueError("Must provide dataset_name or dataset_id")
        response = self._get(
            path,
            params=params,
        )
        raise_for_status_with_text(response)
        result = response.json()
        if isinstance(result, list):
            if len(result) == 0:
                raise ValueError(f"Dataset {dataset_name} not found")
            return Dataset(**result[0])
        return Dataset(**result)

    def list_datasets(self, limit: int = 100) -> Iterable[Dataset]:
        """List the datasets on the LangChain+ API."""
        response = self._get("/datasets", params={"limit": limit})
        raise_for_status_with_text(response)
        return [Dataset(**dataset) for dataset in response.json()]

    @xor_args(("dataset_id", "dataset_name"))
    def delete_dataset(
        self, *, dataset_id: Optional[str] = None, dataset_name: Optional[str] = None
    ) -> Dataset:
        """Delete a dataset by ID or name."""
        if dataset_name is not None:
            dataset_id = self.read_dataset(dataset_name=dataset_name).id
        if dataset_id is None:
            raise ValueError("Must provide either dataset name or ID")
        response = requests.delete(
            f"{self.api_url}/datasets/{dataset_id}",
            headers=self._headers,
        )
        raise_for_status_with_text(response)
        return response.json()

    @xor_args(("dataset_id", "dataset_name"))
    def create_example(
        self,
        inputs: Dict[str, Any],
        dataset_id: Optional[UUID] = None,
        dataset_name: Optional[str] = None,
        created_at: Optional[datetime] = None,
        outputs: Dict[str, Any] | None = None,
    ) -> Example:
        """Create a dataset example in the LangChain+ API."""
        if dataset_id is None:
            dataset_id = self.read_dataset(dataset_name=dataset_name).id

        data = {
            "inputs": inputs,
            "outputs": outputs,
            "dataset_id": dataset_id,
        }
        if created_at:
            data["created_at"] = created_at.isoformat()
        example = ExampleCreate(**data)
        response = requests.post(
            f"{self.api_url}/examples", headers=self._headers, data=example.json()
        )
        raise_for_status_with_text(response)
        result = response.json()
        return Example(**result)

    def read_example(self, example_id: str) -> Example:
        """Read an example from the LangChain+ API."""
        response = self._get(f"/examples/{example_id}")
        raise_for_status_with_text(response)
        return Example(**response.json())

    def list_examples(
        self, dataset_id: Optional[str] = None, dataset_name: Optional[str] = None
    ) -> Iterable[Example]:
        """List the examples on the LangChain+ API."""
        params = {}
        if dataset_id is not None:
            params["dataset"] = dataset_id
        elif dataset_name is not None:
            dataset_id = self.read_dataset(dataset_name=dataset_name).id
            params["dataset"] = dataset_id
        response = self._get("/examples", params=params)
        raise_for_status_with_text(response)
        return [Example(**example) for example in response.json()]

    @staticmethod
    async def _arun_llm(
        llm: BaseLanguageModel,
        inputs: Dict[str, Any],
        langchain_tracer: LangChainTracerV2,
    ) -> Union[LLMResult, ChatResult]:
        if isinstance(llm, BaseLLM):
            llm_prompts: List[str] = inputs["prompts"]
            llm_output = await llm.agenerate(llm_prompts, callbacks=[langchain_tracer])
        elif isinstance(llm, BaseChatModel):
            chat_prompts: List[str] = inputs["prompts"]
            messages = [
                parse_chat_messages(chat_prompt) for chat_prompt in chat_prompts
            ]
            llm_output = await llm.agenerate(messages, callbacks=[langchain_tracer])
        else:
            raise ValueError(f"Unsupported LLM type {type(llm)}")
        return llm_output

    @staticmethod
    async def _arun_llm_or_chain(
        example: Example,
        langchain_tracer: LangChainTracerV2,
        llm_or_chain: Union[Chain, BaseLanguageModel],
        n_repetitions: int,
    ) -> Union[List[dict], List[str], List[LLMResult], List[ChatResult]]:
        """Run the chain asynchronously."""
        previous_example_id = langchain_tracer.example_id
        langchain_tracer.example_id = example.id
        outputs = []
        for _ in range(n_repetitions):
            try:
                if isinstance(llm_or_chain, BaseLanguageModel):
                    output: Any = await LangChainPlusClient._arun_llm(
                        llm_or_chain, example.inputs, langchain_tracer
                    )
                else:
                    output = await llm_or_chain.arun(
                        example.inputs, callbacks=[langchain_tracer]
                    )
                outputs.append(output)
            except Exception as e:
                logger.warning(f"Chain failed for example {example.id}. Error: {e}")
                outputs.append({"Error": str(e)})
            finally:
                langchain_tracer.example_id = previous_example_id
        return outputs

    @staticmethod
    async def _gather_with_concurrency(
        n: int,
        initializer: Callable[[], Coroutine[Any, Any, Tuple[LangChainTracerV2, Dict]]],
        *async_funcs: Callable[[LangChainTracerV2, Dict], Coroutine[Any, Any, Any]],
    ) -> List[Any]:
        """
        Run coroutines with a concurrency limit.

        Args:
            n: The maximum number of concurrent tasks.
            initializer: A coroutine that initializes shared resources for the tasks.
            async_funcs: The async_funcs to be run concurrently.

        Returns:
            A list of results from the coroutines.
        """
        semaphore = asyncio.Semaphore(n)
        tracer, job_state = await initializer()

        async def run_coroutine_with_semaphore(
            async_func: Callable[[LangChainTracerV2, Dict], Coroutine[Any, Any, Any]]
        ) -> Any:
            async with semaphore:
                return await async_func(tracer, job_state)

        return await asyncio.gather(
            *(run_coroutine_with_semaphore(function) for function in async_funcs)
        )

    async def _tracer_initializer(
        self, session_name: str
    ) -> Tuple[LangChainTracerV2, dict]:
        """
        Initialize a tracer to share across tasks.

        Args:
            session_name: The session name for the tracer.

        Returns:
            A LangChainTracerV2 instance with an active session.
        """
        job_state = {"num_processed": 0}
        with tracing_v2_enabled(session_name=session_name) as session:
            tracer = LangChainTracerV2()
            tracer.session = session
            return tracer, job_state

    async def arun_on_dataset(
        self,
        dataset_name: str,
        llm_or_chain: Union[Chain, BaseLanguageModel],
        concurrency_level: int = 5,
        num_repetitions: int = 1,
        session_name: Optional[str] = None,
        verbose: bool = False,
    ) -> Dict[str, Any]:
        """
        Run the chain on a dataset and store traces to the specified session name.

        Args:
            dataset_name: Name of the dataset to run the chain on.
            llm_or_chain: Chain or language model to run over the dataset.
            concurrency_level: The number of async tasks to run concurrently.
            num_repetitions: Number of times to run the model on each example.
                This is useful when testing success rates or generating confidence
                intervals.
            session_name: Name of the session to store the traces in.
                Defaults to {dataset_name}-{chain class name}-{datetime}.
            verbose: Whether to print progress.

        Returns:
            A dictionary mapping example ids to the model outputs.
        """
        if session_name is None:
            current_time = datetime.now().strftime("%Y-%m-%d-%H-%M-%S")
            session_name = (
                f"{dataset_name}-{llm_or_chain.__class__.__name__}-{current_time}"
            )
        dataset = self.read_dataset(dataset_name=dataset_name)
        examples = self.list_examples(dataset_id=str(dataset.id))
        results: Dict[str, List[Any]] = {}

        async def process_example(
            example: Example, tracer: LangChainTracerV2, job_state: dict
        ) -> None:
            """Process a single example."""
            result = await LangChainPlusClient._arun_llm_or_chain(
                example,
                tracer,
                llm_or_chain,
                num_repetitions,
            )
            results[str(example.id)] = result
            job_state["num_processed"] += 1
            if verbose:
                print(
                    f"Processed examples: {job_state['num_processed']}",
                    end="\r",
                    flush=True,
                )

        await self._gather_with_concurrency(
            concurrency_level,
            functools.partial(self._tracer_initializer, session_name),
            *(functools.partial(process_example, e) for e in examples),
        )
        return results

    @staticmethod
    def run_llm(
        llm: BaseLanguageModel,
        inputs: Dict[str, Any],
        langchain_tracer: LangChainTracerV2,
    ) -> Union[LLMResult, ChatResult]:
        """Run the language model on the example."""
        if isinstance(llm, BaseLLM):
            llm_prompts: List[str] = inputs["prompts"]
            llm_output = llm.generate(llm_prompts, callbacks=[langchain_tracer])
        elif isinstance(llm, BaseChatModel):
            chat_prompts: List[str] = inputs["prompts"]
            messages = [
                parse_chat_messages(chat_prompt) for chat_prompt in chat_prompts
            ]
            llm_output = llm.generate(messages, callbacks=[langchain_tracer])
        else:
            raise ValueError(f"Unsupported LLM type {type(llm)}")
        return llm_output

    @staticmethod
    def run_llm_or_chain(
        example: Example,
        langchain_tracer: LangChainTracerV2,
        llm_or_chain: Union[Chain, BaseLanguageModel],
        n_repetitions: int,
    ) -> Union[List[dict], List[str], List[LLMResult], List[ChatResult]]:
        """Run the chain synchronously."""
        previous_example_id = langchain_tracer.example_id
        langchain_tracer.example_id = example.id
        outputs = []
        for _ in range(n_repetitions):
            try:
                if isinstance(llm_or_chain, BaseLanguageModel):
                    output: Any = LangChainPlusClient.run_llm(
                        llm_or_chain, example.inputs, langchain_tracer
                    )
                else:
                    output = llm_or_chain.run(
                        example.inputs, callbacks=[langchain_tracer]
                    )
                outputs.append(output)
            except Exception as e:
                logger.warning(f"Chain failed for example {example.id}. Error: {e}")
                outputs.append({"Error": str(e)})
            finally:
                langchain_tracer.example_id = previous_example_id
        return outputs

    def run_on_dataset(
        self,
        dataset_name: str,
        llm_or_chain: Union[Chain, BaseLanguageModel],
        num_repetitions: int = 1,
        session_name: Optional[str] = None,
        verbose: bool = False,
    ) -> Dict[str, Any]:
        """Run the chain on a dataset and store traces to the specified session name.

        Args:
            dataset_name: Name of the dataset to run the chain on.
            llm_or_chain: Chain or language model to run over the dataset.
            num_repetitions: Number of times to run the model on each example.
                This is useful when testing success rates or generating confidence
                intervals.
            session_name: Name of the session to store the traces in.
                Defaults to {dataset_name}-{chain class name}-{datetime}.
            verbose: Whether to print progress.

        Returns:
            A dictionary mapping example ids to the model outputs.
        """
        if session_name is None:
            current_time = datetime.now().strftime("%Y-%m-%d-%H-%M-%S")
            session_name = (
                f"{dataset_name}-{llm_or_chain.__class__.__name__}-{current_time}"
            )
        dataset = self.read_dataset(dataset_name=dataset_name)
        examples = self.list_examples(dataset_id=str(dataset.id))
        results: Dict[str, Any] = {}
        with tracing_v2_enabled(session_name=session_name) as session:
            tracer = LangChainTracerV2()
            tracer.session = session

            for i, example in enumerate(examples):
                result = self.run_llm_or_chain(
                    example,
                    tracer,
                    llm_or_chain,
                    num_repetitions,
                )
                if verbose:
                    print(f"{i+1} processed", flush=True, end="\r")
                results[str(example.id)] = result
        return results
@@ -0,0 +1,54 @@
from datetime import datetime
from typing import Any, Dict, List, Optional
from uuid import UUID

from pydantic import BaseModel, Field

from langchain.callbacks.tracers.schemas import Run


class ExampleBase(BaseModel):
    """Example base model."""

    dataset_id: UUID
    inputs: Dict[str, Any]
    outputs: Optional[Dict[str, Any]] = Field(default=None)


class ExampleCreate(ExampleBase):
    """Example create model."""

    id: Optional[UUID]
    created_at: datetime = Field(default_factory=datetime.utcnow)


class Example(ExampleBase):
    """Example model."""

    id: UUID
    created_at: datetime
    modified_at: Optional[datetime] = Field(default=None)
    runs: List[Run] = Field(default_factory=list)


class DatasetBase(BaseModel):
    """Dataset base model."""

    tenant_id: UUID
    name: str
    description: str


class DatasetCreate(DatasetBase):
    """Dataset create model."""

    id: Optional[UUID]
    created_at: datetime = Field(default_factory=datetime.utcnow)


class Dataset(DatasetBase):
    """Dataset ORM model."""

    id: UUID
    created_at: datetime
    modified_at: Optional[datetime] = Field(default=None)
@@ -0,0 +1,42 @@
"""Client Utils."""
import re
from typing import Dict, List, Optional, Sequence, Type, Union

from langchain.schema import (
    AIMessage,
    BaseMessage,
    ChatMessage,
    HumanMessage,
    SystemMessage,
)

_DEFAULT_MESSAGES_T = Union[Type[HumanMessage], Type[SystemMessage], Type[AIMessage]]
_RESOLUTION_MAP: Dict[str, _DEFAULT_MESSAGES_T] = {
    "Human": HumanMessage,
    "AI": AIMessage,
    "System": SystemMessage,
}


def parse_chat_messages(
    input_text: str, roles: Optional[Sequence[str]] = None
) -> List[BaseMessage]:
    """Parse chat messages from a string. This is not robust."""
    roles = roles or ["Human", "AI", "System"]
    roles_pattern = "|".join(roles)
    pattern = (
        rf"(?P<entity>{roles_pattern}): (?P<message>"
        rf"(?:.*\n?)*?)(?=(?:{roles_pattern}): |\Z)"
    )
    matches = re.finditer(pattern, input_text, re.MULTILINE)

    results: List[BaseMessage] = []
    for match in matches:
        entity = match.group("entity")
        message = match.group("message").rstrip("\n")
        if entity in _RESOLUTION_MAP:
            results.append(_RESOLUTION_MAP[entity](content=message))
        else:
            results.append(ChatMessage(role=entity, content=message))

    return results
@@ -0,0 +1,234 @@
"""Test the LangChain+ client."""
import uuid
from datetime import datetime
from io import BytesIO
from typing import Any, Dict, List, Optional, Union
from unittest import mock

import pytest

from langchain.base_language import BaseLanguageModel
from langchain.callbacks.tracers.langchain import LangChainTracerV2
from langchain.callbacks.tracers.schemas import TracerSessionV2
from langchain.chains.base import Chain
from langchain.client.langchain import (
    LangChainPlusClient,
    _get_link_stem,
    _is_localhost,
)
from langchain.client.models import Dataset, Example

_CREATED_AT = datetime(2015, 1, 1, 0, 0, 0)
_TENANT_ID = "7a3d2b56-cd5b-44e5-846f-7eb6e8144ce4"


@pytest.mark.parametrize(
    "api_url, expected_url",
    [
        ("http://localhost:8000", "http://localhost"),
        ("http://www.example.com", "http://www.example.com"),
        (
            "https://hosted-1234-23qwerty.f.234.foobar.gateway.dev",
            "https://hosted-1234-23qwerty.f.234.foobar.gateway.dev",
        ),
        ("https://www.langchain.com/path/to/nowhere", "https://www.langchain.com"),
    ],
)
def test_link_split(api_url: str, expected_url: str) -> None:
    """Test the link splitting handles both localhost and deployed urls."""
    assert _get_link_stem(api_url) == expected_url


def test_is_localhost() -> None:
    assert _is_localhost("http://localhost:8000")
    assert _is_localhost("http://127.0.0.1:8000")
    assert _is_localhost("http://0.0.0.0:8000")
    assert not _is_localhost("http://example.com:8000")


def test_validate_api_key_if_hosted() -> None:
    def mock_get_seeded_tenant_id(api_url: str, api_key: Optional[str]) -> str:
        return _TENANT_ID

    with mock.patch.object(
        LangChainPlusClient, "_get_seeded_tenant_id", new=mock_get_seeded_tenant_id
    ):
        with pytest.raises(ValueError, match="API key must be provided"):
            LangChainPlusClient(api_url="http://www.example.com")

    with mock.patch.object(
        LangChainPlusClient, "_get_seeded_tenant_id", new=mock_get_seeded_tenant_id
    ):
        client = LangChainPlusClient(api_url="http://localhost:8000")
        assert client.api_url == "http://localhost:8000"
        assert client.api_key is None


def test_headers() -> None:
    def mock_get_seeded_tenant_id(api_url: str, api_key: Optional[str]) -> str:
        return _TENANT_ID

    with mock.patch.object(
        LangChainPlusClient, "_get_seeded_tenant_id", new=mock_get_seeded_tenant_id
    ):
        client = LangChainPlusClient(api_url="http://localhost:8000", api_key="123")
        assert client._headers == {"authorization": "Bearer 123"}

    with mock.patch.object(
        LangChainPlusClient, "_get_seeded_tenant_id", new=mock_get_seeded_tenant_id
    ):
        client_no_key = LangChainPlusClient(api_url="http://localhost:8000")
        assert client_no_key._headers == {}


@mock.patch("langchain.client.langchain.requests.post")
def test_upload_csv(mock_post: mock.Mock) -> None:
    mock_response = mock.Mock()
    dataset_id = str(uuid.uuid4())
    example_1 = Example(
        id=str(uuid.uuid4()),
        created_at=_CREATED_AT,
        inputs={"input": "1"},
        outputs={"output": "2"},
        dataset_id=dataset_id,
    )
    example_2 = Example(
        id=str(uuid.uuid4()),
        created_at=_CREATED_AT,
        inputs={"input": "3"},
        outputs={"output": "4"},
        dataset_id=dataset_id,
    )

    mock_response.json.return_value = {
        "id": dataset_id,
        "name": "test.csv",
        "description": "Test dataset",
        "owner_id": "the owner",
        "created_at": _CREATED_AT,
        "examples": [example_1, example_2],
        "tenant_id": _TENANT_ID,
    }
    mock_post.return_value = mock_response

    client = LangChainPlusClient(
        api_url="http://localhost:8000", api_key="123", tenant_id=_TENANT_ID
    )
    csv_file = ("test.csv", BytesIO(b"input,output\n1,2\n3,4\n"))

    dataset = client.upload_csv(
        csv_file, "Test dataset", input_keys=["input"], output_keys=["output"]
    )

    assert dataset.id == uuid.UUID(dataset_id)
    assert dataset.name == "test.csv"
    assert dataset.description == "Test dataset"


@pytest.mark.asyncio
async def test_arun_on_dataset(monkeypatch: pytest.MonkeyPatch) -> None:
    dataset = Dataset(
        id=uuid.uuid4(),
        name="test",
        description="Test dataset",
        owner_id="owner",
        created_at=_CREATED_AT,
        tenant_id=_TENANT_ID,
    )
    uuids = [
        "0c193153-2309-4704-9a47-17aee4fb25c8",
        "0d11b5fd-8e66-4485-b696-4b55155c0c05",
        "90d696f0-f10d-4fd0-b88b-bfee6df08b84",
        "4ce2c6d8-5124-4c0c-8292-db7bdebcf167",
        "7b5a524c-80fa-4960-888e-7d380f9a11ee",
    ]
    examples = [
        Example(
            id=uuids[0],
            created_at=_CREATED_AT,
            inputs={"input": "1"},
            outputs={"output": "2"},
            dataset_id=str(uuid.uuid4()),
        ),
        Example(
            id=uuids[1],
            created_at=_CREATED_AT,
            inputs={"input": "3"},
            outputs={"output": "4"},
            dataset_id=str(uuid.uuid4()),
        ),
        Example(
            id=uuids[2],
            created_at=_CREATED_AT,
            inputs={"input": "5"},
            outputs={"output": "6"},
            dataset_id=str(uuid.uuid4()),
        ),
        Example(
            id=uuids[3],
            created_at=_CREATED_AT,
            inputs={"input": "7"},
            outputs={"output": "8"},
            dataset_id=str(uuid.uuid4()),
        ),
        Example(
            id=uuids[4],
            created_at=_CREATED_AT,
            inputs={"input": "9"},
            outputs={"output": "10"},
            dataset_id=str(uuid.uuid4()),
        ),
    ]

    def mock_read_dataset(*args: Any, **kwargs: Any) -> Dataset:
        return dataset

    def mock_list_examples(*args: Any, **kwargs: Any) -> List[Example]:
        return examples

    async def mock_arun_chain(
        example: Example,
        tracer: Any,
        llm_or_chain: Union[BaseLanguageModel, Chain],
        n_repetitions: int,
    ) -> List[Dict[str, Any]]:
        return [
            {"result": f"Result for example {example.id}"} for _ in range(n_repetitions)
        ]

    def mock_load_session(
        self: Any, name: str, *args: Any, **kwargs: Any
    ) -> TracerSessionV2:
        return TracerSessionV2(name=name, tenant_id=_TENANT_ID, id=uuid.uuid4())

    with mock.patch.object(
        LangChainPlusClient, "read_dataset", new=mock_read_dataset
    ), mock.patch.object(
        LangChainPlusClient, "list_examples", new=mock_list_examples
    ), mock.patch.object(
        LangChainPlusClient, "_arun_llm_or_chain", new=mock_arun_chain
    ), mock.patch.object(
        LangChainTracerV2, "load_session", new=mock_load_session
    ):
        monkeypatch.setenv("LANGCHAIN_TENANT_ID", _TENANT_ID)
        client = LangChainPlusClient(
            api_url="http://localhost:8000", api_key="123", tenant_id=_TENANT_ID
        )
        chain = mock.MagicMock()
        num_repetitions = 3
        results = await client.arun_on_dataset(
            dataset_name="test",
            llm_or_chain=chain,
            concurrency_level=2,
            session_name="test_session",
            num_repetitions=num_repetitions,
        )

        expected = {
            uuid_: [
                {"result": f"Result for example {uuid.UUID(uuid_)}"}
                for _ in range(num_repetitions)
            ]
            for uuid_ in uuids
        }
        assert results == expected
@@ -0,0 +1,70 @@
"""Test LangChain+ Client Utils."""

from typing import List

from langchain.client.utils import parse_chat_messages
from langchain.schema import (
    AIMessage,
    BaseMessage,
    ChatMessage,
    HumanMessage,
    SystemMessage,
)


def test_parse_chat_messages() -> None:
    """Test that chat messages are parsed correctly."""
    input_text = (
        "Human: I am human roar\nAI: I am AI beep boop\nSystem: I am a system message"
    )
    expected = [
        HumanMessage(content="I am human roar"),
        AIMessage(content="I am AI beep boop"),
        SystemMessage(content="I am a system message"),
    ]
    assert parse_chat_messages(input_text) == expected


def test_parse_chat_messages_empty_input() -> None:
    """Test that an empty input string returns an empty list."""
    input_text = ""
    expected: List[BaseMessage] = []
    assert parse_chat_messages(input_text) == expected


def test_parse_chat_messages_multiline_messages() -> None:
    """Test that multiline messages are parsed correctly."""
    input_text = (
        "Human: I am a human\nand I roar\nAI: I am an AI\nand I"
        " beep boop\nSystem: I am a system\nand a message"
    )
    expected = [
        HumanMessage(content="I am a human\nand I roar"),
        AIMessage(content="I am an AI\nand I beep boop"),
        SystemMessage(content="I am a system\nand a message"),
    ]
    assert parse_chat_messages(input_text) == expected


def test_parse_chat_messages_custom_roles() -> None:
    """Test that custom roles are parsed correctly."""
    input_text = "Client: I need help\nAgent: I'm here to help\nClient: Thank you"
    expected = [
        ChatMessage(role="Client", content="I need help"),
        ChatMessage(role="Agent", content="I'm here to help"),
        ChatMessage(role="Client", content="Thank you"),
    ]
    assert parse_chat_messages(input_text, roles=["Client", "Agent"]) == expected


def test_parse_chat_messages_embedded_roles() -> None:
    """Test that messages with embedded role references are parsed correctly."""
    input_text = (
        "Human: Oh ai what if you said AI: foo bar?"
        "\nAI: Well, that would be interesting!"
    )
    expected = [
        HumanMessage(content="Oh ai what if you said AI: foo bar?"),
        AIMessage(content="Well, that would be interesting!"),
    ]
    assert parse_chat_messages(input_text) == expected