From 37a89918e02f16b889f3d0cf99f0c23a1eb9fbfb Mon Sep 17 00:00:00 2001 From: Naman Modi Date: Wed, 21 Jun 2023 14:08:20 +0530 Subject: [PATCH] Infino integration for simplified logs, metrics & search across LLM data & token usage (#6218) ### Integration of Infino with LangChain for Enhanced Observability This PR aims to integrate [Infino](https://github.com/infinohq/infino), an open-source observability platform written in Rust for storing metrics and logs at scale, with LangChain, providing users with a streamlined and efficient method of tracking and recording LangChain experiments. By incorporating Infino into LangChain, users will be able to gain valuable insights and easily analyze the behavior of their language models. #### Please refer to the following files related to integration: - `InfinoCallbackHandler`: A [callback handler](https://github.com/naman-modi/langchain/blob/feature/infino-integration/langchain/callbacks/infino_callback.py) specifically designed for storing chain responses within Infino. - Example `infino.ipynb` file: A comprehensive notebook named [infino.ipynb](https://github.com/naman-modi/langchain/blob/feature/infino-integration/docs/extras/modules/callbacks/integrations/infino.ipynb) has been included to guide users on effectively leveraging Infino for tracking LangChain requests. - [Integration Doc](https://github.com/naman-modi/langchain/blob/feature/infino-integration/docs/extras/ecosystem/integrations/infino.mdx) for Infino integration. By integrating Infino, LangChain users will gain access to powerful visualization and debugging capabilities. Infino enables easy tracking of inputs, outputs, token usage, and execution time of LLMs. This comprehensive observability ensures a deeper understanding of individual executions and facilitates effective debugging. 
Co-authors: @vinaykakade @savannahar68 --------- Co-authored-by: Vinay Kakade --- docs/extras/ecosystem/integrations/infino.mdx | 35 ++ .../callbacks/integrations/infino.ipynb | 419 ++++++++++++++++++ langchain/callbacks/__init__.py | 2 + langchain/callbacks/infino_callback.py | 172 +++++++ 4 files changed, 628 insertions(+) create mode 100644 docs/extras/ecosystem/integrations/infino.mdx create mode 100644 docs/extras/modules/callbacks/integrations/infino.ipynb create mode 100644 langchain/callbacks/infino_callback.py diff --git a/docs/extras/ecosystem/integrations/infino.mdx b/docs/extras/ecosystem/integrations/infino.mdx new file mode 100644 index 00000000..dcca8af5 --- /dev/null +++ b/docs/extras/ecosystem/integrations/infino.mdx @@ -0,0 +1,35 @@ +# Infino + +>[Infino](https://github.com/infinohq/infino) is an open-source observability platform that stores both metrics and application logs together. + +Key features of Infino include: +- Metrics Tracking: Capture the time taken by the LLM to handle a request, errors, number of tokens, and a cost indication for the particular LLM. +- Data Tracking: Log and store prompt, request, and response data for each LangChain interaction. +- Graph Visualization: Generate basic graphs over time, depicting metrics such as request duration, error occurrences, token count, and cost. + +## Installation and Setup + +First, you'll need to install the `infinopy` Python package as follows: + +```bash +pip install infinopy +``` + +If you already have an Infino Server running, then you're good to go; but if +you don't, follow the next steps to start it: + +- Make sure you have Docker installed +- Run the following in your terminal: + ``` + docker run --rm --detach --name infino-example -p 3000:3000 infinohq/infino:latest + ``` + + + +## Using Infino + +See a [usage example of `InfinoCallbackHandler`](/docs/modules/callbacks/integrations/infino.html). 
+ +```python +from langchain.callbacks import InfinoCallbackHandler +``` diff --git a/docs/extras/modules/callbacks/integrations/infino.ipynb b/docs/extras/modules/callbacks/integrations/infino.ipynb new file mode 100644 index 00000000..e619fc0e --- /dev/null +++ b/docs/extras/modules/callbacks/integrations/infino.ipynb @@ -0,0 +1,419 @@ +{ + "cells": [ + { + "attachments": {}, + "cell_type": "markdown", + "id": "8d10861f-a550-4443-bc63-4ce2ae13b841", + "metadata": {}, + "source": [ + "# Infino - LangChain LLM Monitoring Example\n", + "\n", + "This example shows how one can track the following while calling OpenAI models via LangChain and [Infino](https://github.com/infinohq/infino):\n", + "\n", + "* prompt input,\n", + "* response from chatgpt or any other LangChain model,\n", + "* latency,\n", + "* errors,\n", + "* number of tokens consumed" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "id": "3a5a0976-9953-41d8-880c-eb3f2992e936", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Requirement already satisfied: matplotlib in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (3.7.1)\n", + "Requirement already satisfied: contourpy>=1.0.1 in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from matplotlib) (1.0.7)\n", + "Requirement already satisfied: cycler>=0.10 in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from matplotlib) (0.11.0)\n", + "Requirement already satisfied: fonttools>=4.22.0 in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from matplotlib) (4.39.4)\n", + "Requirement already satisfied: kiwisolver>=1.0.1 in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from matplotlib) (1.4.4)\n", + "Requirement already satisfied: numpy>=1.20 in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from matplotlib) (1.24.3)\n", + "Requirement already 
satisfied: packaging>=20.0 in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from matplotlib) (23.1)\n", + "Requirement already satisfied: pillow>=6.2.0 in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from matplotlib) (9.5.0)\n", + "Requirement already satisfied: pyparsing>=2.3.1 in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from matplotlib) (3.0.9)\n", + "Requirement already satisfied: python-dateutil>=2.7 in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from matplotlib) (2.8.2)\n", + "Requirement already satisfied: six>=1.5 in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from python-dateutil>=2.7->matplotlib) (1.16.0)\n", + "Requirement already satisfied: infinopy in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (0.0.1)\n", + "Requirement already satisfied: docker in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from infinopy) (6.1.3)\n", + "Requirement already satisfied: requests in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from infinopy) (2.31.0)\n", + "Requirement already satisfied: packaging>=14.0 in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from docker->infinopy) (23.1)\n", + "Requirement already satisfied: urllib3>=1.26.0 in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from docker->infinopy) (2.0.2)\n", + "Requirement already satisfied: websocket-client>=0.32.0 in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from docker->infinopy) (1.5.2)\n", + "Requirement already satisfied: charset-normalizer<4,>=2 in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from requests->infinopy) (3.1.0)\n", + "Requirement already satisfied: idna<4,>=2.5 in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from 
requests->infinopy) (3.4)\n", + "Requirement already satisfied: certifi>=2017.4.17 in /Users/vinaykakade/.pyenv/versions/3.10.11/lib/python3.10/site-packages (from requests->infinopy) (2023.5.7)\n" + ] + } + ], + "source": [ + "# Install necessary dependencies.\n", + "!pip install infinopy\n", + "!pip install matplotlib\n", + "\n", + "# Remove the (1) import sys and sys.path.append(..) and (2) uncomment `!pip install langchain` after merging the PR for Infino/LangChain integration.\n", + "import sys\n", + "sys.path.append(\"../../../../../langchain\")\n", + "#!pip install langchain\n", + "\n", + "\n", + "import datetime as dt\n", + "from infinopy import InfinoClient\n", + "import json\n", + "from langchain.llms import OpenAI\n", + "from langchain.callbacks import InfinoCallbackHandler\n", + "import matplotlib.pyplot as plt\n", + "import matplotlib.dates as md\n", + "import os\n", + "import time\n", + "import sys" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "9f90210d-c805-4a0c-81e4-d5298942afc4", + "metadata": {}, + "source": [ + "## Start Infino server, initialize the Infino client\n" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "id": "748b9858-5145-4351-976a-ca2d54e836a6", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "497a621125800abdd19f57ce7e033349b3cf83ca8cea6a74e8e28433a42ecadd\n" + ] + } + ], + "source": [ + "# Start server using the Infino docker image.\n", + "!docker run --rm --detach --name infino-example -p 3000:3000 infinohq/infino:latest\n", + "\n", + "# Create Infino client.\n", + "client = InfinoClient()" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "b6b81cda-b841-43ee-8c5e-b1576555765f", + "metadata": {}, + "source": [ + "## Read the questions dataset" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "id": "b659fd0c-0d8c-470e-8b6c-867a117f2a27", + "metadata": {}, + "outputs": [], + "source": [ + "# These are a subset 
of questions from Stanford's QA dataset - \n", + "# https://rajpurkar.github.io/SQuAD-explorer/\n", + "data = '''In what country is Normandy located?\n", + "When were the Normans in Normandy?\n", + "From which countries did the Norse originate?\n", + "Who was the Norse leader?\n", + "What century did the Normans first gain their separate identity?\n", + "Who gave their name to Normandy in the 1000's and 1100's\n", + "What is France a region of?\n", + "Who did King Charles III swear fealty to?\n", + "When did the Frankish identity emerge?\n", + "Who was the duke in the battle of Hastings?\n", + "Who ruled the duchy of Normandy\n", + "What religion were the Normans\n", + "What type of major impact did the Norman dynasty have on modern Europe?\n", + "Who was famed for their Christian spirit?\n", + "Who assimilted the Roman language?\n", + "Who ruled the country of Normandy?\n", + "What principality did William the conquerer found?\n", + "What is the original meaning of the word Norman?\n", + "When was the Latin version of the word Norman first recorded?\n", + "What name comes from the English words Normans/Normanz?'''\n", + "\n", + "questions = data.split('\\n')" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "dce1b820-3f1a-4b94-b848-4c6032cadc18", + "metadata": {}, + "source": [ + "## LangChain OpenAI Q&A; Publish metrics and logs to Infino" + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "id": "d5cebf35-2d10-48b8-ab11-c4a574c595d2", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "In what country is Normandy located?\n", + "generations=[[Generation(text='\\n\\nNormandy is located in France.', generation_info={'finish_reason': 'stop', 'logprobs': None})]] llm_output={'token_usage': {'total_tokens': 16, 'completion_tokens': 9, 'prompt_tokens': 7}, 'model_name': 'text-davinci-003'} run=RunInfo(run_id=UUID('8de21639-acec-4bd1-a12d-8124de1e20da'))\n", + "When were the Normans in 
Normandy?\n", + "generations=[[Generation(text='\\n\\nThe Normans first settled in Normandy in the late 9th century.', generation_info={'finish_reason': 'stop', 'logprobs': None})]] llm_output={'token_usage': {'total_tokens': 24, 'completion_tokens': 16, 'prompt_tokens': 8}, 'model_name': 'text-davinci-003'} run=RunInfo(run_id=UUID('cf81fc86-250b-4e6e-9d92-2df3bebb019a'))\n", + "From which countries did the Norse originate?\n", + "generations=[[Generation(text='\\n\\nThe Norse originated from Scandinavia, which includes modern-day Norway, Sweden, and Denmark.', generation_info={'finish_reason': 'stop', 'logprobs': None})]] llm_output={'token_usage': {'total_tokens': 29, 'completion_tokens': 21, 'prompt_tokens': 8}, 'model_name': 'text-davinci-003'} run=RunInfo(run_id=UUID('50f42f5e-b4a4-411a-a049-f92cb573a74f'))\n", + "Who was the Norse leader?\n", + "generations=[[Generation(text='\\n\\nThe most famous Norse leader was the legendary Viking king Ragnar Lodbrok. He is believed to have lived in the 9th century and is renowned for his exploits in England and France.', generation_info={'finish_reason': 'stop', 'logprobs': None})]] llm_output={'token_usage': {'total_tokens': 45, 'completion_tokens': 39, 'prompt_tokens': 6}, 'model_name': 'text-davinci-003'} run=RunInfo(run_id=UUID('e32f31cb-ddc9-4863-8e6e-cb7a281a0ada'))\n", + "What century did the Normans first gain their separate identity?\n", + "generations=[[Generation(text='\\n\\nThe Normans first gained their separate identity in the 11th century.', generation_info={'finish_reason': 'stop', 'logprobs': None})]] llm_output={'token_usage': {'total_tokens': 28, 'completion_tokens': 16, 'prompt_tokens': 12}, 'model_name': 'text-davinci-003'} run=RunInfo(run_id=UUID('da9d8f73-b3b3-4bc5-8495-da8b11462a51'))\n", + "Who gave their name to Normandy in the 1000's and 1100's\n", + "generations=[[Generation(text='\\n\\nThe Normans, a people from northern France, gave their name to Normandy in the 1000s and 1100s. 
The Normans were descended from Viking settlers who had come to the region in the late 800s.', generation_info={'finish_reason': 'stop', 'logprobs': None})]] llm_output={'token_usage': {'total_tokens': 58, 'completion_tokens': 45, 'prompt_tokens': 13}, 'model_name': 'text-davinci-003'} run=RunInfo(run_id=UUID('bb5829bf-b6a6-4429-adfa-414ac5be46e5'))\n", + "What is France a region of?\n", + "generations=[[Generation(text='\\n\\nFrance is a region of Europe.', generation_info={'finish_reason': 'stop', 'logprobs': None})]] llm_output={'token_usage': {'total_tokens': 16, 'completion_tokens': 9, 'prompt_tokens': 7}, 'model_name': 'text-davinci-003'} run=RunInfo(run_id=UUID('6943880b-b4e4-4c74-9ca1-8c03c10f7e9c'))\n", + "Who did King Charles III swear fealty to?\n", + "generations=[[Generation(text='\\n\\nKing Charles III swore fealty to Pope Innocent III.', generation_info={'finish_reason': 'stop', 'logprobs': None})]] llm_output={'token_usage': {'total_tokens': 23, 'completion_tokens': 13, 'prompt_tokens': 10}, 'model_name': 'text-davinci-003'} run=RunInfo(run_id=UUID('c91fd663-09e6-4d00-b746-4c7fd96f9ceb'))\n", + "When did the Frankish identity emerge?\n", + "generations=[[Generation(text='\\n\\nThe Frankish identity began to emerge in the late 5th century, when the Franks began to expand their power and influence in the region. The Franks were a Germanic tribe that had migrated to the area from the east and had established a kingdom in what is now modern-day France. 
The Franks were eventually able to establish a powerful kingdom that lasted until the 10th century.', generation_info={'finish_reason': 'stop', 'logprobs': None})]] llm_output={'token_usage': {'total_tokens': 86, 'completion_tokens': 78, 'prompt_tokens': 8}, 'model_name': 'text-davinci-003'} run=RunInfo(run_id=UUID('23f86775-e592-4cb8-baa3-46ebe74305b2'))\n", + "Who was the duke in the battle of Hastings?\n", + "generations=[[Generation(text='\\n\\nThe Duke of Normandy, William the Conqueror, was the leader of the Norman forces at the Battle of Hastings in 1066.', generation_info={'finish_reason': 'stop', 'logprobs': None})]] llm_output={'token_usage': {'total_tokens': 39, 'completion_tokens': 28, 'prompt_tokens': 11}, 'model_name': 'text-davinci-003'} run=RunInfo(run_id=UUID('ad5b7984-8758-4d95-a5eb-ee56e0218f6b'))\n" + ] + } + ], + "source": [ + "# Set your key here.\n", + "#os.environ[\"OPENAI_API_KEY\"] = \"YOUR_API_KEY\"\n", + "\n", + "# Create callback handler. This logs latency, errors, token usage, prompts as well as prompt responses to Infino.\n", + "handler = InfinoCallbackHandler(model_id=\"test_openai\", model_version=\"0.1\", verbose=False)\n", + "\n", + "# Create LLM.\n", + "llm = OpenAI(temperature=0.1)\n", + "\n", + "# Number of questions to ask the OpenAI model. We limit to a short number here to save $$ while running this demo.\n", + "num_questions = 10\n", + "\n", + "questions = questions[0:num_questions]\n", + "for question in questions:\n", + " print(question)\n", + "\n", + " # We send the question to OpenAI API, with Infino callback.\n", + " llm_result = llm.generate([question], callbacks=[handler])\n", + " print(llm_result)" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "b68ec697-c922-4fd9-aad1-f49c6ac24e8a", + "metadata": {}, + "source": [ + "## Create Metric Charts\n", + "\n", + "We now use matplotlib to create graphs of latency, errors and tokens consumed." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 19, + "id": "f078c612-89e0-4a1d-b1a8-bf36b664a10e", + "metadata": {}, + "outputs": [ + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "image/png": "", + "text/plain": [ + "
" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "# Helper function to create a graph using matplotlib.\n", + "def plot(data, title):\n", + " data = json.loads(data)\n", + "\n", + " # Extract x and y values from the data\n", + " timestamps = [item[\"time\"] for item in data]\n", + " dates=[dt.datetime.fromtimestamp(ts) for ts in timestamps]\n", + " y = [item[\"value\"] for item in data]\n", + "\n", + " plt.rcParams['figure.figsize'] = [6, 4]\n", + " plt.subplots_adjust(bottom=0.2)\n", + " plt.xticks(rotation=25 )\n", + " ax=plt.gca()\n", + " xfmt = md.DateFormatter('%Y-%m-%d %H:%M:%S')\n", + " ax.xaxis.set_major_formatter(xfmt)\n", + " \n", + " # Create the plot\n", + " plt.plot(dates, y)\n", + "\n", + " # Set labels and title\n", + " plt.xlabel(\"Time\")\n", + " plt.ylabel(\"Value\")\n", + " plt.title(title)\n", + "\n", + " plt.show()\n", + "\n", + "response = client.search_ts(\"__name__\", \"latency\", 0, int(time.time()))\n", + "plot(response.text, \"Latency\")\n", + "\n", + "response = client.search_ts(\"__name__\", \"error\", 0, int(time.time()))\n", + "plot(response.text, \"Errors\")\n", + "\n", + "response = client.search_ts(\"__name__\", \"prompt_tokens\", 0, int(time.time()))\n", + "plot(response.text, \"Prompt Tokens\")\n", + "\n", + "response = client.search_ts(\"__name__\", \"completion_tokens\", 0, int(time.time()))\n", + "plot(response.text, \"Completion Tokens\")\n", + "\n", + "response = client.search_ts(\"__name__\", \"total_tokens\", 0, int(time.time()))\n", + "plot(response.text, \"Total Tokens\")\n" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "c3d61822-1781-4bc6-97a2-2abc5c2b2e75", + "metadata": {}, + "source": [ + "## Full text query on prompt or prompt outputs." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 20, + "id": "a0f051f0-e2bc-44e7-8dfb-bfd5bbd0fc9f", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Results for normandy : [{\"time\":1686821979,\"fields\":{\"prompt\":\"In what country is Normandy located?\"},\"text\":\"In what country is Normandy located?\"},{\"time\":1686821982,\"fields\":{\"prompt_response\":\"\\n\\nNormandy is located in France.\"},\"text\":\"\\n\\nNormandy is located in France.\"},{\"time\":1686821984,\"fields\":{\"prompt_response\":\"\\n\\nThe Normans first settled in Normandy in the late 9th century.\"},\"text\":\"\\n\\nThe Normans first settled in Normandy in the late 9th century.\"},{\"time\":1686821993,\"fields\":{\"prompt\":\"Who gave their name to Normandy in the 1000's and 1100's\"},\"text\":\"Who gave their name to Normandy in the 1000's and 1100's\"},{\"time\":1686821997,\"fields\":{\"prompt_response\":\"\\n\\nThe Normans, a people from northern France, gave their name to Normandy in the 1000s and 1100s. The Normans were descended from Viking settlers who had come to the region in the late 800s.\"},\"text\":\"\\n\\nThe Normans, a people from northern France, gave their name to Normandy in the 1000s and 1100s. 
The Normans were descended from Viking settlers who had come to the region in the late 800s.\"}]\n", + "===\n", + "Results for king charles III : [{\"time\":1686821998,\"fields\":{\"prompt\":\"Who did King Charles III swear fealty to?\"},\"text\":\"Who did King Charles III swear fealty to?\"},{\"time\":1686822000,\"fields\":{\"prompt_response\":\"\\n\\nKing Charles III swore fealty to Pope Innocent III.\"},\"text\":\"\\n\\nKing Charles III swore fealty to Pope Innocent III.\"}]\n" + ] + } + ], + "source": [ + "# Search for a particular prompt text.\n", + "query = \"normandy\"\n", + "response = client.search_log(query, 0, int(time.time()))\n", + "print(\"Results for\", query, \":\", response.text)\n", + "\n", + "print(\"===\")\n", + "\n", + "query = \"king charles III\"\n", + "response = client.search_log(\"king charles III\", 0, int(time.time()))\n", + "print(\"Results for\", query, \":\", response.text)\n" + ] + }, + { + "attachments": {}, + "cell_type": "markdown", + "id": "4b171074-c775-48e0-a4b3-f550e2c8eccb", + "metadata": {}, + "source": [ + "## Stop the Infino server" + ] + }, + { + "cell_type": "code", + "execution_count": 21, + "id": "147663cb-b88f-4cfb-9726-7231dbec7cc1", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "infino-example\n" + ] + } + ], + "source": [ + "!docker rm -f infino-example" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "id": "86f36c49-53a3-460d-b74b-995cda7726b3", + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.9.4" + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} diff --git
a/langchain/callbacks/__init__.py b/langchain/callbacks/__init__.py
index 082ef22c..985cf9c8 100644
--- a/langchain/callbacks/__init__.py
+++ b/langchain/callbacks/__init__.py
@@ -7,6 +7,7 @@ from langchain.callbacks.clearml_callback import ClearMLCallbackHandler
 from langchain.callbacks.comet_ml_callback import CometCallbackHandler
 from langchain.callbacks.file import FileCallbackHandler
 from langchain.callbacks.human import HumanApprovalCallbackHandler
+from langchain.callbacks.infino_callback import InfinoCallbackHandler
 from langchain.callbacks.manager import (
     get_openai_callback,
     tracing_enabled,
@@ -36,6 +37,7 @@ __all__ = [
     "FileCallbackHandler",
     "FinalStreamingStdOutCallbackHandler",
     "HumanApprovalCallbackHandler",
+    "InfinoCallbackHandler",
     "MlflowCallbackHandler",
     "OpenAICallbackHandler",
     "StdOutCallbackHandler",
diff --git a/langchain/callbacks/infino_callback.py b/langchain/callbacks/infino_callback.py
new file mode 100644
index 00000000..f8a01d65
--- /dev/null
+++ b/langchain/callbacks/infino_callback.py
@@ -0,0 +1,188 @@
+import time
+from typing import Any, Dict, List, Optional, Union
+
+from langchain.callbacks.base import BaseCallbackHandler
+from langchain.schema import AgentAction, AgentFinish, LLMResult
+
+
+def import_infino() -> Any:
+    """Import `infinopy` lazily and return a new `InfinoClient`.
+
+    Raises:
+        ImportError: if the `infinopy` package is not installed.
+    """
+    try:
+        from infinopy import InfinoClient
+    except ImportError:
+        raise ImportError(
+            "To use the Infino callbacks manager you need to have the"
+            " `infinopy` python package installed."
+            " Please install it with `pip install infinopy`"
+        )
+    return InfinoClient()
+
+
+class InfinoCallbackHandler(BaseCallbackHandler):
+    """Callback Handler that logs to Infino.
+
+    Prompts and responses are appended to the Infino log; latency, the
+    error flag and token counts are appended to Infino time series.
+    """
+
+    def __init__(
+        self,
+        model_id: Optional[str] = None,
+        model_version: Optional[str] = None,
+        verbose: bool = False,
+    ) -> None:
+        # Set Infino client
+        self.client = import_infino()
+        self.model_id = model_id
+        self.model_version = model_version
+        self.verbose = verbose
+
+    def _send_to_infino(
+        self,
+        key: str,
+        value: Any,
+        is_ts: bool = True,
+    ) -> None:
+        """Send the key-value to Infino.
+
+        Parameters:
+        key (str): the key to send to Infino.
+        value (Any): the value to send to Infino.
+        is_ts (bool): if True, the value is part of a time series, else it
+                      is sent as a log message.
+        """
+        payload = {
+            "date": int(time.time()),
+            key: value,
+            "labels": {
+                "model_id": self.model_id,
+                "model_version": self.model_version,
+            },
+        }
+        if self.verbose:
+            print(f"Tracking {key} with Infino: {payload}")
+
+        # Append to Infino time series only if is_ts is True, otherwise
+        # append to Infino log.
+        if is_ts:
+            self.client.append_ts(payload)
+        else:
+            self.client.append_log(payload)
+
+    def on_llm_start(
+        self,
+        serialized: Dict[str, Any],
+        prompts: List[str],
+        **kwargs: Any,
+    ) -> None:
+        """Log the prompts to Infino, and set start time and error flag."""
+        for prompt in prompts:
+            self._send_to_infino("prompt", prompt, is_ts=False)
+
+        # Set the error flag to indicate no error (this will get overridden
+        # in on_llm_error if an error occurs).
+        self.error = 0
+
+        # Set the start time (so that we can calculate the request
+        # duration in on_llm_end).
+        self.start_time = time.time()
+
+    def on_llm_new_token(self, token: str, **kwargs: Any) -> None:
+        """Do nothing when a new token is generated."""
+        pass
+
+    def on_llm_end(self, response: LLMResult, **kwargs: Any) -> None:
+        """Log the latency, error, token usage, and response to Infino."""
+        # Calculate and track the request latency.
+        self.end_time = time.time()
+        duration = self.end_time - self.start_time
+        self._send_to_infino("latency", duration)
+
+        # Track success or error flag.
+        self._send_to_infino("error", self.error)
+
+        # Track token usage. Not every LLM reports it, so a missing
+        # `token_usage` entry (or a missing counter) is skipped instead of
+        # raising KeyError.
+        llm_output = response.llm_output
+        token_usage = (
+            llm_output.get("token_usage") if isinstance(llm_output, dict) else None
+        )
+        if token_usage:
+            for name in ("prompt_tokens", "total_tokens", "completion_tokens"):
+                if name in token_usage:
+                    self._send_to_infino(name, token_usage[name])
+
+        # Track prompt response.
+        for generations in response.generations:
+            for generation in generations:
+                self._send_to_infino("prompt_response", generation.text, is_ts=False)
+
+    def on_llm_error(
+        self, error: Union[Exception, KeyboardInterrupt], **kwargs: Any
+    ) -> None:
+        """Set the error flag and report it to Infino.
+
+        LangChain calls this hook instead of `on_llm_end` when the LLM call
+        raises, so the flag has to be sent from here; otherwise a failure
+        would never reach the `error` time series.
+        """
+        self.error = 1
+        self._send_to_infino("error", self.error)
+
+    def on_chain_start(
+        self, serialized: Dict[str, Any], inputs: Dict[str, Any], **kwargs: Any
+    ) -> None:
+        """Do nothing when LLM chain starts."""
+        pass
+
+    def on_chain_end(self, outputs: Dict[str, Any], **kwargs: Any) -> None:
+        """Do nothing when LLM chain ends."""
+        pass
+
+    def on_chain_error(
+        self, error: Union[Exception, KeyboardInterrupt], **kwargs: Any
+    ) -> None:
+        """Do nothing when LLM chain errors (chain errors are not logged yet)."""
+        pass
+
+    def on_tool_start(
+        self,
+        serialized: Dict[str, Any],
+        input_str: str,
+        **kwargs: Any,
+    ) -> None:
+        """Do nothing when tool starts."""
+        pass
+
+    def on_agent_action(self, action: AgentAction, **kwargs: Any) -> Any:
+        """Do nothing when agent takes a specific action."""
+        pass
+
+    def on_tool_end(
+        self,
+        output: str,
+        observation_prefix: Optional[str] = None,
+        llm_prefix: Optional[str] = None,
+        **kwargs: Any,
+    ) -> None:
+        """Do nothing when tool ends."""
+        pass
+
+    def on_tool_error(
+        self, error: Union[Exception, KeyboardInterrupt], **kwargs: Any
+    ) -> None:
+        """Do nothing when tool outputs an error."""
+        pass
+
+    def on_text(self, text: str, **kwargs: Any) -> None:
+        """Do nothing."""
+        pass
+
+    def on_agent_finish(self, finish: AgentFinish, **kwargs: Any) -> None:
+        """Do nothing."""
+        pass