forked from Archives/langchain
initial commit
commit
18aeb72012
@ -0,0 +1,11 @@
|
|||||||
|
[flake8]
|
||||||
|
exclude =
|
||||||
|
.venv
|
||||||
|
__pycache__
|
||||||
|
notebooks
|
||||||
|
# Recommend matching the black line length (default 88),
|
||||||
|
# rather than using the flake8 default of 79:
|
||||||
|
max-line-length = 88
|
||||||
|
extend-ignore =
|
||||||
|
# See https://github.com/PyCQA/pycodestyle/issues/373
|
||||||
|
E203,
|
@ -0,0 +1,23 @@
|
|||||||
|
name: lint
|
||||||
|
|
||||||
|
on: [push]
|
||||||
|
|
||||||
|
jobs:
|
||||||
|
build:
|
||||||
|
runs-on: ubuntu-latest
|
||||||
|
strategy:
|
||||||
|
matrix:
|
||||||
|
python-version: ["3.7"]
|
||||||
|
steps:
|
||||||
|
- uses: actions/checkout@v3
|
||||||
|
- name: Set up Python ${{ matrix.python-version }}
|
||||||
|
uses: actions/setup-python@v3
|
||||||
|
with:
|
||||||
|
python-version: ${{ matrix.python-version }}
|
||||||
|
- name: Install dependencies
|
||||||
|
run: |
|
||||||
|
python -m pip install --upgrade pip
|
||||||
|
pip install -r requirements.txt
|
||||||
|
- name: Analysing the code with our lint
|
||||||
|
run: |
|
||||||
|
make lint
|
@ -0,0 +1,23 @@
|
|||||||
|
name: test
|
||||||
|
|
||||||
|
on: [push]
|
||||||
|
|
||||||
|
jobs:
|
||||||
|
build:
|
||||||
|
runs-on: ubuntu-latest
|
||||||
|
strategy:
|
||||||
|
matrix:
|
||||||
|
python-version: ["3.7"]
|
||||||
|
steps:
|
||||||
|
- uses: actions/checkout@v3
|
||||||
|
- name: Set up Python ${{ matrix.python-version }}
|
||||||
|
uses: actions/setup-python@v3
|
||||||
|
with:
|
||||||
|
python-version: ${{ matrix.python-version }}
|
||||||
|
- name: Install dependencies
|
||||||
|
run: |
|
||||||
|
python -m pip install --upgrade pip
|
||||||
|
pip install -r test_requirements.txt
|
||||||
|
- name: Run unit tests
|
||||||
|
run: |
|
||||||
|
make tests
|
@ -0,0 +1,130 @@
|
|||||||
|
# Byte-compiled / optimized / DLL files
|
||||||
|
__pycache__/
|
||||||
|
*.py[cod]
|
||||||
|
*$py.class
|
||||||
|
|
||||||
|
# C extensions
|
||||||
|
*.so
|
||||||
|
|
||||||
|
# Distribution / packaging
|
||||||
|
.Python
|
||||||
|
build/
|
||||||
|
develop-eggs/
|
||||||
|
dist/
|
||||||
|
downloads/
|
||||||
|
eggs/
|
||||||
|
.eggs/
|
||||||
|
lib/
|
||||||
|
lib64/
|
||||||
|
parts/
|
||||||
|
sdist/
|
||||||
|
var/
|
||||||
|
wheels/
|
||||||
|
pip-wheel-metadata/
|
||||||
|
share/python-wheels/
|
||||||
|
*.egg-info/
|
||||||
|
.installed.cfg
|
||||||
|
*.egg
|
||||||
|
MANIFEST
|
||||||
|
|
||||||
|
# PyInstaller
|
||||||
|
# Usually these files are written by a python script from a template
|
||||||
|
# before PyInstaller builds the exe, so as to inject date/other infos into it.
|
||||||
|
*.manifest
|
||||||
|
*.spec
|
||||||
|
|
||||||
|
# Installer logs
|
||||||
|
pip-log.txt
|
||||||
|
pip-delete-this-directory.txt
|
||||||
|
|
||||||
|
# Unit test / coverage reports
|
||||||
|
htmlcov/
|
||||||
|
.tox/
|
||||||
|
.nox/
|
||||||
|
.coverage
|
||||||
|
.coverage.*
|
||||||
|
.cache
|
||||||
|
nosetests.xml
|
||||||
|
coverage.xml
|
||||||
|
*.cover
|
||||||
|
*.py,cover
|
||||||
|
.hypothesis/
|
||||||
|
.pytest_cache/
|
||||||
|
|
||||||
|
# Translations
|
||||||
|
*.mo
|
||||||
|
*.pot
|
||||||
|
|
||||||
|
# Django stuff:
|
||||||
|
*.log
|
||||||
|
local_settings.py
|
||||||
|
db.sqlite3
|
||||||
|
db.sqlite3-journal
|
||||||
|
|
||||||
|
# Flask stuff:
|
||||||
|
instance/
|
||||||
|
.webassets-cache
|
||||||
|
|
||||||
|
# Scrapy stuff:
|
||||||
|
.scrapy
|
||||||
|
|
||||||
|
# Sphinx documentation
|
||||||
|
docs/_build/
|
||||||
|
|
||||||
|
# PyBuilder
|
||||||
|
target/
|
||||||
|
|
||||||
|
# Jupyter Notebook
|
||||||
|
.ipynb_checkpoints
|
||||||
|
notebooks/
|
||||||
|
|
||||||
|
# IPython
|
||||||
|
profile_default/
|
||||||
|
ipython_config.py
|
||||||
|
|
||||||
|
# pyenv
|
||||||
|
.python-version
|
||||||
|
|
||||||
|
# pipenv
|
||||||
|
# According to pypa/pipenv#598, it is recommended to include Pipfile.lock in version control.
|
||||||
|
# However, in case of collaboration, if having platform-specific dependencies or dependencies
|
||||||
|
# having no cross-platform support, pipenv may install dependencies that don't work, or not
|
||||||
|
# install all needed dependencies.
|
||||||
|
#Pipfile.lock
|
||||||
|
|
||||||
|
# PEP 582; used by e.g. github.com/David-OConnor/pyflow
|
||||||
|
__pypackages__/
|
||||||
|
|
||||||
|
# Celery stuff
|
||||||
|
celerybeat-schedule
|
||||||
|
celerybeat.pid
|
||||||
|
|
||||||
|
# SageMath parsed files
|
||||||
|
*.sage.py
|
||||||
|
|
||||||
|
# Environments
|
||||||
|
.env
|
||||||
|
.venv
|
||||||
|
env/
|
||||||
|
venv/
|
||||||
|
ENV/
|
||||||
|
env.bak/
|
||||||
|
venv.bak/
|
||||||
|
|
||||||
|
# Spyder project settings
|
||||||
|
.spyderproject
|
||||||
|
.spyproject
|
||||||
|
|
||||||
|
# Rope project settings
|
||||||
|
.ropeproject
|
||||||
|
|
||||||
|
# mkdocs documentation
|
||||||
|
/site
|
||||||
|
|
||||||
|
# mypy
|
||||||
|
.mypy_cache/
|
||||||
|
.dmypy.json
|
||||||
|
dmypy.json
|
||||||
|
|
||||||
|
# Pyre type checker
|
||||||
|
.pyre/
|
@ -0,0 +1,2 @@
|
|||||||
|
include langchain/VERSION
|
||||||
|
include LICENSE
|
@ -0,0 +1,17 @@
|
|||||||
|
.PHONY: format lint tests integration_tests
|
||||||
|
|
||||||
|
format:
|
||||||
|
black .
|
||||||
|
isort .
|
||||||
|
|
||||||
|
lint:
|
||||||
|
mypy .
|
||||||
|
black . --check
|
||||||
|
isort . --check
|
||||||
|
flake8 .
|
||||||
|
|
||||||
|
tests:
|
||||||
|
pytest tests/unit_tests
|
||||||
|
|
||||||
|
integration_tests:
|
||||||
|
pytest tests/integration_tests
|
@ -0,0 +1,80 @@
|
|||||||
|
# 🦜️🔗 LangChain
|
||||||
|
|
||||||
|
⚡ Building applications with LLMs through composability ⚡
|
||||||
|
|
||||||
|
[![lint](https://github.com/hwchase17/langchain/actions/workflows/lint.yml/badge.svg)](https://github.com/hwchase17/langchain/actions/workflows/lint.yml) [![test](https://github.com/hwchase17/langchain/actions/workflows/test.yml/badge.svg)](https://github.com/hwchase17/langchain/actions/workflows/test.yml) [![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
## Quick Install
|
||||||
|
|
||||||
|
`pip install langchain`
|
||||||
|
|
||||||
|
## 🤔 What is this?
|
||||||
|
|
||||||
|
Large language models (LLMs) are emerging as a transformative technology, enabling
|
||||||
|
developers to build applications that they previously could not.
|
||||||
|
But using these LLMs in isolation is often not enough to
|
||||||
|
create a truly powerful app - the real power comes when you are able to
|
||||||
|
combine them with other sources of computation or knowledge.
|
||||||
|
|
||||||
|
This library is aimed at assisting in the development of those types of applications.
|
||||||
|
It aims to create:
|
||||||
|
1. a comprehensive collection of pieces you would ever want to combine
|
||||||
|
2. a flexible interface for combining pieces into a single comprehensive "chain"
|
||||||
|
3. a schema for easily saving and sharing those chains
|
||||||
|
|
||||||
|
## 🚀 What can I do with this
|
||||||
|
|
||||||
|
This project was largely inspired by a few projects seen on Twitter for which we thought it would make sense to have more explicit tooling. A lot of the initial functionality was done in an attempt to recreate those. Those are:
|
||||||
|
|
||||||
|
**[Self-ask-with-search](https://ofir.io/self-ask.pdf)**
|
||||||
|
|
||||||
|
To recreate this paper, use the following code snippet or checkout the [example notebook](https://github.com/hwchase17/langchain/blob/master/examples/self_ask_with_search.ipynb).
|
||||||
|
|
||||||
|
```
|
||||||
|
from langchain import SelfAskWithSearchChain, OpenAI, SerpAPIChain
|
||||||
|
|
||||||
|
llm = OpenAI(temperature=0)
|
||||||
|
search = SerpAPIChain()
|
||||||
|
|
||||||
|
self_ask_with_search = SelfAskWithSearchChain(llm=llm, search_chain=search)
|
||||||
|
|
||||||
|
self_ask_with_search.run("What is the hometown of the reigning men's U.S. Open champion?")
|
||||||
|
```
|
||||||
|
|
||||||
|
**[LLM Math](https://twitter.com/amasad/status/1568824744367259648?s=20&t=-7wxpXBJinPgDuyHLouP1w)**
|
||||||
|
|
||||||
|
To recreate this example, use the following code snippet or check out the [example notebook](https://github.com/hwchase17/langchain/blob/master/examples/llm_math.ipynb).
|
||||||
|
|
||||||
|
```
|
||||||
|
from langchain import OpenAI, LLMMathChain
|
||||||
|
|
||||||
|
llm = OpenAI(temperature=0)
|
||||||
|
llm_math = LLMMathChain(llm=llm)
|
||||||
|
|
||||||
|
llm_math.run("How many of the integers between 0 and 99 inclusive are divisible by 8?")
|
||||||
|
```
|
||||||
|
|
||||||
|
**Generic Prompting**
|
||||||
|
|
||||||
|
You can also use this for simple prompting pipelines, as in the below example and this [example notebook](https://github.com/hwchase17/langchain/blob/master/examples/simple_prompts.ipynb).
|
||||||
|
|
||||||
|
```
|
||||||
|
from langchain import Prompt, OpenAI, LLMChain
|
||||||
|
|
||||||
|
template = """Question: {question}
|
||||||
|
|
||||||
|
Answer: Let's think step by step."""
|
||||||
|
prompt = Prompt(template=template, input_variables=["question"])
|
||||||
|
llm_chain = LLMChain(prompt=prompt, llm=OpenAI(temperature=0))
|
||||||
|
|
||||||
|
question = "What NFL team won the Super Bowl in the year Justin Beiber was born?"
|
||||||
|
|
||||||
|
llm_chain.predict(question=question)
|
||||||
|
```
|
||||||
|
|
||||||
|
## 📖 Documentation
|
||||||
|
|
||||||
|
The above examples are probably the most user-friendly documentation that exists,
|
||||||
|
but full API docs can be found [here](https://langchain.readthedocs.io/en/latest/?).
|
@ -0,0 +1,21 @@
|
|||||||
|
# Minimal makefile for Sphinx documentation
|
||||||
|
#
|
||||||
|
|
||||||
|
# You can set these variables from the command line, and also
|
||||||
|
# from the environment for the first two.
|
||||||
|
SPHINXOPTS ?=
|
||||||
|
SPHINXBUILD ?= sphinx-build
|
||||||
|
SPHINXAUTOBUILD ?= sphinx-autobuild
|
||||||
|
SOURCEDIR = .
|
||||||
|
BUILDDIR = _build
|
||||||
|
|
||||||
|
# Put it first so that "make" without argument is like "make help".
|
||||||
|
help:
|
||||||
|
@$(SPHINXBUILD) -M help "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O)
|
||||||
|
|
||||||
|
.PHONY: help Makefile
|
||||||
|
|
||||||
|
# Catch-all target: route all unknown targets to Sphinx using the new
|
||||||
|
# "make mode" option. $(O) is meant as a shortcut for $(SPHINXOPTS).
|
||||||
|
%: Makefile
|
||||||
|
@$(SPHINXBUILD) -M $@ "$(SOURCEDIR)" "$(BUILDDIR)" $(SPHINXOPTS) $(O)
|
@ -0,0 +1,65 @@
|
|||||||
|
"""Configuration file for the Sphinx documentation builder."""
|
||||||
|
# Configuration file for the Sphinx documentation builder.
|
||||||
|
#
|
||||||
|
# This file only contains a selection of the most common options. For a full
|
||||||
|
# list see the documentation:
|
||||||
|
# https://www.sphinx-doc.org/en/master/usage/configuration.html
|
||||||
|
|
||||||
|
# -- Path setup --------------------------------------------------------------
|
||||||
|
|
||||||
|
# If extensions (or modules to document with autodoc) are in another directory,
|
||||||
|
# add these directories to sys.path here. If the directory is relative to the
|
||||||
|
# documentation root, use os.path.abspath to make it absolute, like shown here.
|
||||||
|
#
|
||||||
|
# import os
|
||||||
|
# import sys
|
||||||
|
# sys.path.insert(0, os.path.abspath('.'))
|
||||||
|
|
||||||
|
import langchain
|
||||||
|
|
||||||
|
# -- Project information -----------------------------------------------------
|
||||||
|
|
||||||
|
project = "LangChain"
|
||||||
|
copyright = "2022, Harrison Chase"
|
||||||
|
author = "Harrison Chase"
|
||||||
|
|
||||||
|
version = langchain.__version__
|
||||||
|
release = langchain.__version__
|
||||||
|
|
||||||
|
|
||||||
|
# -- General configuration ---------------------------------------------------
|
||||||
|
|
||||||
|
# Add any Sphinx extension module names here, as strings. They can be
|
||||||
|
# extensions coming with Sphinx (named 'sphinx.ext.*') or your custom
|
||||||
|
# ones.
|
||||||
|
extensions = [
|
||||||
|
"sphinx.ext.autodoc",
|
||||||
|
"sphinx.ext.autodoc.typehints",
|
||||||
|
"sphinx.ext.autosummary",
|
||||||
|
"sphinx.ext.napoleon",
|
||||||
|
]
|
||||||
|
|
||||||
|
# autodoc_typehints = "signature"
|
||||||
|
autodoc_typehints = "description"
|
||||||
|
|
||||||
|
# Add any paths that contain templates here, relative to this directory.
|
||||||
|
templates_path = ["_templates"]
|
||||||
|
|
||||||
|
# List of patterns, relative to source directory, that match files and
|
||||||
|
# directories to ignore when looking for source files.
|
||||||
|
# This pattern also affects html_static_path and html_extra_path.
|
||||||
|
exclude_patterns = ["_build", "Thumbs.db", ".DS_Store"]
|
||||||
|
|
||||||
|
|
||||||
|
# -- Options for HTML output -------------------------------------------------
|
||||||
|
|
||||||
|
# The theme to use for HTML and HTML Help pages. See the documentation for
|
||||||
|
# a list of builtin themes.
|
||||||
|
#
|
||||||
|
html_theme = "sphinx_rtd_theme"
|
||||||
|
# html_theme = "sphinx_typlog_theme"
|
||||||
|
|
||||||
|
# Add any paths that contain custom static files (such as style sheets) here,
|
||||||
|
# relative to this directory. They are copied after the builtin static files,
|
||||||
|
# so a file named "default.css" will overwrite the builtin "default.css".
|
||||||
|
html_static_path = ["_static"]
|
@ -0,0 +1,10 @@
|
|||||||
|
Welcome to LangChain
|
||||||
|
==========================
|
||||||
|
|
||||||
|
.. toctree::
|
||||||
|
:maxdepth: 2
|
||||||
|
:caption: User API
|
||||||
|
|
||||||
|
modules/prompt
|
||||||
|
modules/llms
|
||||||
|
modules/chains
|
@ -0,0 +1,35 @@
|
|||||||
|
@ECHO OFF
|
||||||
|
|
||||||
|
pushd %~dp0
|
||||||
|
|
||||||
|
REM Command file for Sphinx documentation
|
||||||
|
|
||||||
|
if "%SPHINXBUILD%" == "" (
|
||||||
|
set SPHINXBUILD=sphinx-build
|
||||||
|
)
|
||||||
|
set SOURCEDIR=.
|
||||||
|
set BUILDDIR=_build
|
||||||
|
|
||||||
|
if "%1" == "" goto help
|
||||||
|
|
||||||
|
%SPHINXBUILD% >NUL 2>NUL
|
||||||
|
if errorlevel 9009 (
|
||||||
|
echo.
|
||||||
|
echo.The 'sphinx-build' command was not found. Make sure you have Sphinx
|
||||||
|
echo.installed, then set the SPHINXBUILD environment variable to point
|
||||||
|
echo.to the full path of the 'sphinx-build' executable. Alternatively you
|
||||||
|
echo.may add the Sphinx directory to PATH.
|
||||||
|
echo.
|
||||||
|
echo.If you don't have Sphinx installed, grab it from
|
||||||
|
echo.http://sphinx-doc.org/
|
||||||
|
exit /b 1
|
||||||
|
)
|
||||||
|
|
||||||
|
%SPHINXBUILD% -M %1 %SOURCEDIR% %BUILDDIR% %SPHINXOPTS% %O%
|
||||||
|
goto end
|
||||||
|
|
||||||
|
:help
|
||||||
|
%SPHINXBUILD% -M help %SOURCEDIR% %BUILDDIR% %SPHINXOPTS% %O%
|
||||||
|
|
||||||
|
:end
|
||||||
|
popd
|
@ -0,0 +1,7 @@
|
|||||||
|
:mod:`langchain.chains`
|
||||||
|
=======================
|
||||||
|
|
||||||
|
.. automodule:: langchain.chains
|
||||||
|
:members:
|
||||||
|
:undoc-members:
|
||||||
|
|
@ -0,0 +1,6 @@
|
|||||||
|
:mod:`langchain.llms`
|
||||||
|
=======================
|
||||||
|
|
||||||
|
.. automodule:: langchain.llms
|
||||||
|
:members:
|
||||||
|
:undoc-members:
|
@ -0,0 +1,6 @@
|
|||||||
|
:mod:`langchain.prompt`
|
||||||
|
=======================
|
||||||
|
|
||||||
|
.. automodule:: langchain.prompt
|
||||||
|
:members:
|
||||||
|
:undoc-members:
|
@ -0,0 +1,4 @@
|
|||||||
|
sphinx==4.5.0
|
||||||
|
sphinx-autobuild==2021.3.14
|
||||||
|
sphinx_rtd_theme==1.0.0
|
||||||
|
sphinx-typlog-theme==0.8.0
|
@ -0,0 +1,59 @@
|
|||||||
|
{
|
||||||
|
"cells": [
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": 1,
|
||||||
|
"id": "44e9ba31",
|
||||||
|
"metadata": {},
|
||||||
|
"outputs": [
|
||||||
|
{
|
||||||
|
"data": {
|
||||||
|
"text/plain": [
|
||||||
|
"'Answer: 13\\n'"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
"execution_count": 1,
|
||||||
|
"metadata": {},
|
||||||
|
"output_type": "execute_result"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"source": [
|
||||||
|
"from langchain import OpenAI, LLMMathChain\n",
|
||||||
|
"\n",
|
||||||
|
"llm = OpenAI(temperature=0)\n",
|
||||||
|
"llm_math = LLMMathChain(llm=llm)\n",
|
||||||
|
"\n",
|
||||||
|
"llm_math.run(\"How many of the integers between 0 and 99 inclusive are divisible by 8?\")"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": null,
|
||||||
|
"id": "f62f0c75",
|
||||||
|
"metadata": {},
|
||||||
|
"outputs": [],
|
||||||
|
"source": []
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"metadata": {
|
||||||
|
"kernelspec": {
|
||||||
|
"display_name": "Python 3 (ipykernel)",
|
||||||
|
"language": "python",
|
||||||
|
"name": "python3"
|
||||||
|
},
|
||||||
|
"language_info": {
|
||||||
|
"codemirror_mode": {
|
||||||
|
"name": "ipython",
|
||||||
|
"version": 3
|
||||||
|
},
|
||||||
|
"file_extension": ".py",
|
||||||
|
"mimetype": "text/x-python",
|
||||||
|
"name": "python",
|
||||||
|
"nbconvert_exporter": "python",
|
||||||
|
"pygments_lexer": "ipython3",
|
||||||
|
"version": "3.7.6"
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"nbformat": 4,
|
||||||
|
"nbformat_minor": 5
|
||||||
|
}
|
@ -0,0 +1,74 @@
|
|||||||
|
{
|
||||||
|
"cells": [
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": 1,
|
||||||
|
"id": "7e3b513e",
|
||||||
|
"metadata": {},
|
||||||
|
"outputs": [
|
||||||
|
{
|
||||||
|
"name": "stdout",
|
||||||
|
"output_type": "stream",
|
||||||
|
"text": [
|
||||||
|
"What is the hometown of the reigning men's U.S. Open champion?\n",
|
||||||
|
"Are follow up questions needed here:\u001b[102m Yes.\n",
|
||||||
|
"Follow up: Who is the reigning men's U.S. Open champion?\u001b[0m\n",
|
||||||
|
"Intermediate answer: \u001b[106mCarlos Alcaraz\u001b[0m.\u001b[102m\n",
|
||||||
|
"Follow up: Where is Carlos Alcaraz from?\u001b[0m\n",
|
||||||
|
"Intermediate answer: \u001b[106mEl Palmar, Murcia, Spain\u001b[0m.\u001b[102m\n",
|
||||||
|
"So the final answer is: El Palmar, Murcia, Spain\u001b[0m"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"data": {
|
||||||
|
"text/plain": [
|
||||||
|
"\"What is the hometown of the reigning men's U.S. Open champion?\\nAre follow up questions needed here: Yes.\\nFollow up: Who is the reigning men's U.S. Open champion?\\nIntermediate answer: Carlos Alcaraz.\\nFollow up: Where is Carlos Alcaraz from?\\nIntermediate answer: El Palmar, Murcia, Spain.\\nSo the final answer is: El Palmar, Murcia, Spain\""
|
||||||
|
]
|
||||||
|
},
|
||||||
|
"execution_count": 1,
|
||||||
|
"metadata": {},
|
||||||
|
"output_type": "execute_result"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"source": [
|
||||||
|
"from langchain import SelfAskWithSearchChain, OpenAI, SerpAPIChain\n",
|
||||||
|
"\n",
|
||||||
|
"llm = OpenAI(temperature=0)\n",
|
||||||
|
"search = SerpAPIChain()\n",
|
||||||
|
"\n",
|
||||||
|
"self_ask_with_search = SelfAskWithSearchChain(llm=llm, search_chain=search)\n",
|
||||||
|
"\n",
|
||||||
|
"self_ask_with_search.run(\"What is the hometown of the reigning men's U.S. Open champion?\")"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": null,
|
||||||
|
"id": "6195fc82",
|
||||||
|
"metadata": {},
|
||||||
|
"outputs": [],
|
||||||
|
"source": []
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"metadata": {
|
||||||
|
"kernelspec": {
|
||||||
|
"display_name": "Python 3 (ipykernel)",
|
||||||
|
"language": "python",
|
||||||
|
"name": "python3"
|
||||||
|
},
|
||||||
|
"language_info": {
|
||||||
|
"codemirror_mode": {
|
||||||
|
"name": "ipython",
|
||||||
|
"version": 3
|
||||||
|
},
|
||||||
|
"file_extension": ".py",
|
||||||
|
"mimetype": "text/x-python",
|
||||||
|
"name": "python",
|
||||||
|
"nbconvert_exporter": "python",
|
||||||
|
"pygments_lexer": "ipython3",
|
||||||
|
"version": "3.7.6"
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"nbformat": 4,
|
||||||
|
"nbformat_minor": 5
|
||||||
|
}
|
@ -0,0 +1,64 @@
|
|||||||
|
{
|
||||||
|
"cells": [
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": 7,
|
||||||
|
"id": "51a54c4d",
|
||||||
|
"metadata": {},
|
||||||
|
"outputs": [
|
||||||
|
{
|
||||||
|
"data": {
|
||||||
|
"text/plain": [
|
||||||
|
"' The year Justin Beiber was born was 1994. In 1994, the Dallas Cowboys won the Super Bowl.'"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
"execution_count": 7,
|
||||||
|
"metadata": {},
|
||||||
|
"output_type": "execute_result"
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"source": [
|
||||||
|
"from langchain import Prompt, OpenAI, LLMChain\n",
|
||||||
|
"\n",
|
||||||
|
"template = \"\"\"Question: {question}\n",
|
||||||
|
"\n",
|
||||||
|
"Answer: Let's think step by step.\"\"\"\n",
|
||||||
|
"prompt = Prompt(template=template, input_variables=[\"question\"])\n",
|
||||||
|
"llm_chain = LLMChain(prompt=prompt, llm=OpenAI(temperature=0))\n",
|
||||||
|
"\n",
|
||||||
|
"question = \"What NFL team won the Super Bowl in the year Justin Beiber was born?\"\n",
|
||||||
|
"\n",
|
||||||
|
"llm_chain.predict(question=question)"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"cell_type": "code",
|
||||||
|
"execution_count": null,
|
||||||
|
"id": "03dd6918",
|
||||||
|
"metadata": {},
|
||||||
|
"outputs": [],
|
||||||
|
"source": []
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"metadata": {
|
||||||
|
"kernelspec": {
|
||||||
|
"display_name": "Python 3 (ipykernel)",
|
||||||
|
"language": "python",
|
||||||
|
"name": "python3"
|
||||||
|
},
|
||||||
|
"language_info": {
|
||||||
|
"codemirror_mode": {
|
||||||
|
"name": "ipython",
|
||||||
|
"version": 3
|
||||||
|
},
|
||||||
|
"file_extension": ".py",
|
||||||
|
"mimetype": "text/x-python",
|
||||||
|
"name": "python",
|
||||||
|
"nbconvert_exporter": "python",
|
||||||
|
"pygments_lexer": "ipython3",
|
||||||
|
"version": "3.7.6"
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"nbformat": 4,
|
||||||
|
"nbformat_minor": 5
|
||||||
|
}
|
@ -0,0 +1 @@
|
|||||||
|
0.0.1
|
@ -0,0 +1,27 @@
|
|||||||
|
"""Main entrypoint into package."""
|
||||||
|
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
with open(Path(__file__).absolute().parents[0] / "VERSION") as _f:
|
||||||
|
__version__ = _f.read().strip()
|
||||||
|
|
||||||
|
from langchain.chains import (
|
||||||
|
LLMChain,
|
||||||
|
LLMMathChain,
|
||||||
|
PythonChain,
|
||||||
|
SelfAskWithSearchChain,
|
||||||
|
SerpAPIChain,
|
||||||
|
)
|
||||||
|
from langchain.llms import Cohere, OpenAI
|
||||||
|
from langchain.prompt import Prompt
|
||||||
|
|
||||||
|
__all__ = [
|
||||||
|
"LLMChain",
|
||||||
|
"LLMMathChain",
|
||||||
|
"PythonChain",
|
||||||
|
"SelfAskWithSearchChain",
|
||||||
|
"SerpAPIChain",
|
||||||
|
"Cohere",
|
||||||
|
"OpenAI",
|
||||||
|
"Prompt",
|
||||||
|
]
|
@ -0,0 +1,14 @@
|
|||||||
|
"""Chains are easily reusable components which can be linked together."""
|
||||||
|
from langchain.chains.llm import LLMChain
|
||||||
|
from langchain.chains.llm_math.base import LLMMathChain
|
||||||
|
from langchain.chains.python import PythonChain
|
||||||
|
from langchain.chains.self_ask_with_search.base import SelfAskWithSearchChain
|
||||||
|
from langchain.chains.serpapi import SerpAPIChain
|
||||||
|
|
||||||
|
__all__ = [
|
||||||
|
"LLMChain",
|
||||||
|
"LLMMathChain",
|
||||||
|
"PythonChain",
|
||||||
|
"SelfAskWithSearchChain",
|
||||||
|
"SerpAPIChain",
|
||||||
|
]
|
@ -0,0 +1,41 @@
|
|||||||
|
"""Base interface that all chains should implement."""
|
||||||
|
from abc import ABC, abstractmethod
|
||||||
|
from typing import Any, Dict, List
|
||||||
|
|
||||||
|
|
||||||
|
class Chain(ABC):
    """Base interface that all chains should implement.

    A chain maps a dict of named inputs to a dict of named outputs.
    Subclasses declare their expected keys via ``input_keys`` /
    ``output_keys`` and implement the core logic in ``_run``.
    """

    @property
    @abstractmethod
    def input_keys(self) -> List[str]:
        """Input keys this chain expects."""

    @property
    @abstractmethod
    def output_keys(self) -> List[str]:
        """Output keys this chain expects."""

    def _validate_inputs(self, inputs: Dict[str, str]) -> None:
        """Raise ValueError unless every expected input key is present."""
        missing_keys = set(self.input_keys).difference(inputs)
        if not missing_keys:
            return
        raise ValueError(f"Missing some input keys: {missing_keys}")

    def _validate_outputs(self, outputs: Dict[str, str]) -> None:
        """Raise ValueError unless ``_run`` produced exactly the declared keys."""
        produced, expected = set(outputs), set(self.output_keys)
        if produced == expected:
            return
        raise ValueError(
            f"Did not get output keys that were expected. "
            f"Got: {produced}. Expected: {expected}."
        )

    @abstractmethod
    def _run(self, inputs: Dict[str, str]) -> Dict[str, str]:
        """Run the logic of this chain and return the output."""

    def __call__(self, inputs: Dict[str, Any]) -> Dict[str, str]:
        """Validate inputs, run the chain, and merge its outputs into them."""
        self._validate_inputs(inputs)
        outputs = self._run(inputs)
        self._validate_outputs(outputs)
        return {**inputs, **outputs}
|
@ -0,0 +1,46 @@
|
|||||||
|
"""Chain that just formats a prompt and calls an LLM."""
|
||||||
|
from typing import Any, Dict, List
|
||||||
|
|
||||||
|
from pydantic import BaseModel, Extra
|
||||||
|
|
||||||
|
from langchain.chains.base import Chain
|
||||||
|
from langchain.llms.base import LLM
|
||||||
|
from langchain.prompt import Prompt
|
||||||
|
|
||||||
|
|
||||||
|
class LLMChain(Chain, BaseModel):
    """Chain to run queries against LLMs.

    Formats ``prompt`` with the supplied inputs, feeds the result to
    ``llm``, and returns the raw completion under ``output_key``.
    """

    # Prompt template the chain fills in before calling the LLM.
    prompt: Prompt
    # LLM wrapper invoked with the formatted prompt.
    llm: LLM
    # Name under which the LLM response is returned.
    output_key: str = "text"

    class Config:
        """Configuration for this pydantic object."""

        extra = Extra.forbid
        arbitrary_types_allowed = True

    @property
    def input_keys(self) -> List[str]:
        """Will be whatever keys the prompt expects."""
        return self.prompt.input_variables

    @property
    def output_keys(self) -> List[str]:
        """Will always return text key."""
        return [self.output_key]

    def _run(self, inputs: Dict[str, Any]) -> Dict[str, str]:
        """Format the prompt from ``inputs`` and call the LLM once."""
        prompt_text = self.prompt.format(
            **{key: inputs[key] for key in self.prompt.input_variables}
        )
        # An optional "stop" entry in the inputs is forwarded to the LLM.
        call_kwargs = {"stop": inputs["stop"]} if "stop" in inputs else {}
        return {self.output_key: self.llm(prompt_text, **call_kwargs)}

    def predict(self, **kwargs: Any) -> str:
        """More user-friendly interface for interacting with LLMs."""
        return self(kwargs)[self.output_key]
|
@ -0,0 +1,4 @@
|
|||||||
|
"""Chain that interprets a prompt and executes python code to do math.
|
||||||
|
|
||||||
|
Heavily borrowed from https://replit.com/@amasad/gptpy?v=1#main.py
|
||||||
|
"""
|
@ -0,0 +1,57 @@
|
|||||||
|
"""Chain that interprets a prompt and executes python code to do math."""
|
||||||
|
from typing import Dict, List
|
||||||
|
|
||||||
|
from pydantic import BaseModel, Extra
|
||||||
|
|
||||||
|
from langchain.chains.base import Chain
|
||||||
|
from langchain.chains.llm import LLMChain
|
||||||
|
from langchain.chains.llm_math.prompt import PROMPT
|
||||||
|
from langchain.chains.python import PythonChain
|
||||||
|
from langchain.llms.base import LLM
|
||||||
|
|
||||||
|
|
||||||
|
class LLMMathChain(Chain, BaseModel):
    """Chain that interprets a prompt and executes python code to do math."""

    # LLM wrapper used to translate the question into python code.
    llm: LLM
    # When True, prints the generated code before evaluating it.
    verbose: bool = False
    # Key under which the question is supplied.
    input_key: str = "question"
    # Key under which the answer is returned.
    output_key: str = "answer"

    class Config:
        """Configuration for this pydantic object."""

        extra = Extra.forbid
        arbitrary_types_allowed = True

    @property
    def input_keys(self) -> List[str]:
        """Expect input key."""
        return [self.input_key]

    @property
    def output_keys(self) -> List[str]:
        """Expect output key."""
        return [self.output_key]

    def _run(self, inputs: Dict[str, str]) -> Dict[str, str]:
        llm_executor = LLMChain(prompt=PROMPT, llm=self.llm)
        python_executor = PythonChain()
        question = inputs[self.input_key]
        # Stop generation at "```output" so the LLM emits only a code block
        # (or a direct "Answer:" line), never a fabricated result.
        t = llm_executor.predict(question=question, stop=["```output"]).strip()
        if t.startswith("```python"):
            # Strip the leading "```python" fence (9 chars) and 4 trailing
            # chars; assumes the completion ends with "\n```" — TODO confirm.
            code = t[9:-4]
            if self.verbose:
                print("[DEBUG] evaluating code")
                print(code)
            # NOTE(review): the generated code is exec'd by PythonChain,
            # which trusts the LLM output; do not expose to untrusted input.
            output = python_executor.run(code)
            answer = "Answer: " + output
        elif t.startswith("Answer:"):
            # The model answered directly without emitting code.
            answer = t
        else:
            raise ValueError(f"unknown format from LLM: {t}")
        return {self.output_key: answer}

    def run(self, question: str) -> str:
        """More user-friendly interface for interfacing with LLM math."""
        return self({self.input_key: question})[self.output_key]
|
@ -0,0 +1,40 @@
|
|||||||
|
"""Chain that runs python code.
|
||||||
|
|
||||||
|
Heavily borrowed from https://replit.com/@amasad/gptpy?v=1#main.py
|
||||||
|
"""
|
||||||
|
import sys
|
||||||
|
from io import StringIO
|
||||||
|
from typing import Dict, List
|
||||||
|
|
||||||
|
from pydantic import BaseModel
|
||||||
|
|
||||||
|
from langchain.chains.base import Chain
|
||||||
|
|
||||||
|
|
||||||
|
class PythonChain(Chain, BaseModel):
    """Chain to run python code.

    The code is executed with ``exec`` and everything it prints to
    stdout is captured and returned under ``output_key``.

    SECURITY NOTE: ``exec`` runs arbitrary code with full interpreter
    privileges — never feed this chain untrusted input.
    """

    # Key under which the code to execute is supplied.
    input_key: str = "code"
    # Key under which the captured stdout is returned.
    output_key: str = "output"

    @property
    def input_keys(self) -> List[str]:
        """Expect input key."""
        return [self.input_key]

    @property
    def output_keys(self) -> List[str]:
        """Return output key."""
        return [self.output_key]

    def _run(self, inputs: Dict[str, str]) -> Dict[str, str]:
        """Execute the code and capture everything it writes to stdout."""
        old_stdout = sys.stdout
        sys.stdout = mystdout = StringIO()
        try:
            exec(inputs[self.input_key])
        finally:
            # Always restore stdout, even if the executed code raises;
            # otherwise every later print in the process is swallowed
            # by the abandoned StringIO buffer.
            sys.stdout = old_stdout
        return {self.output_key: mystdout.getvalue()}

    def run(self, code: str) -> str:
        """More user-friendly interface for interfacing with python."""
        return self({self.input_key: code})[self.output_key]
|
@ -0,0 +1,4 @@
|
|||||||
|
"""Chain that does self ask with search.
|
||||||
|
|
||||||
|
Heavily borrowed from https://github.com/ofirpress/self-ask
|
||||||
|
"""
|
@ -0,0 +1,142 @@
|
|||||||
|
"""Chain that does self ask with search."""
|
||||||
|
from typing import Any, Dict, List
|
||||||
|
|
||||||
|
from pydantic import BaseModel, Extra
|
||||||
|
|
||||||
|
from langchain.chains.base import Chain
|
||||||
|
from langchain.chains.llm import LLMChain
|
||||||
|
from langchain.chains.self_ask_with_search.prompt import PROMPT
|
||||||
|
from langchain.chains.serpapi import SerpAPIChain
|
||||||
|
from langchain.llms.base import LLM
|
||||||
|
|
||||||
|
|
||||||
|
def extract_answer(generated: str) -> str:
    """Extract answer from text.

    Takes the last line of *generated*, then the text after the final
    colon, stripping one leading space and one trailing period.

    Args:
        generated: Raw completion text from the LLM.

    Returns:
        The extracted answer, or ``""`` when nothing usable is present.
    """
    if "\n" not in generated:
        last_line = generated
    else:
        last_line = generated.split("\n")[-1]

    if ":" not in last_line:
        after_colon = last_line
    else:
        # NOTE: intentionally splits the full text (not just the last
        # line) on ":" to preserve the original extraction behavior.
        after_colon = generated.split(":")[-1]

    # Guard against empty text: the original [0]/[-1] indexing raised
    # IndexError on empty input or when only a colon-plus-space remains.
    if not after_colon:
        return after_colon
    if " " == after_colon[0]:
        after_colon = after_colon[1:]
    if after_colon and "." == after_colon[-1]:
        after_colon = after_colon[:-1]

    return after_colon
|
||||||
|
|
||||||
|
|
||||||
|
def extract_question(generated: str, followup: str) -> str:
    """Extract the follow-up question from the last line of ``generated``.

    Warns (via print) when the text does not look like a follow-up line,
    then returns the text after the last colon with a single leading space
    removed.
    """
    if "\n" not in generated:
        last_line = generated
    else:
        last_line = generated.split("\n")[-1]

    if followup not in last_line:
        print("we probably should never get here..." + generated)

    if ":" not in last_line:
        after_colon = last_line
    else:
        # NOTE(review): splits the full text rather than just the last
        # line -- kept as-is to match the reference implementation.
        after_colon = generated.split(":")[-1]

    # Guard against an empty tail; after_colon[0] / after_colon[-1]
    # previously raised IndexError when the text ended with ":".
    if after_colon.startswith(" "):
        after_colon = after_colon[1:]
    if after_colon and "?" != after_colon[-1]:
        print("we probably should never get here..." + generated)

    return after_colon
|
||||||
|
|
||||||
|
|
||||||
|
def get_last_line(generated: str) -> str:
    """Return the final line of ``generated`` (the whole text if single-line)."""
    # rsplit with maxsplit=1 yields [generated] when there is no newline,
    # so the [-1] covers both the single-line and multi-line cases.
    return generated.rsplit("\n", 1)[-1]
|
||||||
|
|
||||||
|
|
||||||
|
def greenify(_input: str) -> str:
    """Wrap *_input* in ANSI escape codes for a bright-green background."""
    return "".join(("\x1b[102m", _input, "\x1b[0m"))
|
||||||
|
|
||||||
|
|
||||||
|
def yellowfy(_input: str) -> str:
    """Wrap *_input* in ANSI escape codes for a highlighted background.

    NOTE(review): escape code 106 is a bright-cyan background, although the
    name suggests yellow (103) -- kept as-is to preserve console output.
    """
    return "".join(("\x1b[106m", _input, "\x1b[0m"))
|
||||||
|
|
||||||
|
|
||||||
|
class SelfAskWithSearchChain(Chain, BaseModel):
    """Chain that does self ask with search."""

    # LLM used to propose follow-up questions and compose answers.
    llm: LLM
    # Chain used to answer intermediate follow-up questions via SerpAPI.
    search_chain: SerpAPIChain
    # Key under which the user's question arrives.
    input_key: str = "question"
    # Key under which the final transcript/answer is returned.
    output_key: str = "answer"

    class Config:
        """Configuration for this pydantic object."""

        extra = Extra.forbid
        arbitrary_types_allowed = True

    @property
    def input_keys(self) -> List[str]:
        """Expect input key."""
        return [self.input_key]

    @property
    def output_keys(self) -> List[str]:
        """Expect output key."""
        return [self.output_key]

    def _run(self, inputs: Dict[str, Any]) -> Dict[str, str]:
        """Run the self-ask loop, alternating LLM follow-ups with searches.

        The running prompt transcript grows in ``cur_prompt``; colored
        console output mirrors the transcript as it is built (green for
        LLM text, yellow/cyan for search answers).
        """
        question = inputs[self.input_key]
        llm_chain = LLMChain(llm=self.llm, prompt=PROMPT)
        # Marker strings the few-shot prompt trains the LLM to emit/stop on.
        intermediate = "\nIntermediate answer:"
        followup = "Follow up:"
        finalans = "\nSo the final answer is:"
        cur_prompt = f"{question}\nAre follow up questions needed here:"
        print(cur_prompt, end="")
        ret_text = llm_chain.predict(input=cur_prompt, stop=[intermediate])
        print(greenify(ret_text), end="")
        # Keep looping while the model keeps asking follow-up questions.
        while followup in get_last_line(ret_text):
            cur_prompt += ret_text
            question = extract_question(ret_text, followup)
            external_answer = self.search_chain.search(question)
            if external_answer is not None:
                # Feed the search result back as the intermediate answer.
                cur_prompt += intermediate + " " + external_answer + "."
                print(
                    intermediate + " " + yellowfy(external_answer) + ".",
                    end="",
                )
                ret_text = llm_chain.predict(
                    input=cur_prompt, stop=["\nIntermediate answer:"]
                )
                print(greenify(ret_text), end="")
            else:
                # We only get here in the very rare case that Google returns no answer.
                # Let the LLM produce the intermediate answer itself.
                cur_prompt += intermediate
                print(intermediate + " ")
                cur_prompt += llm_chain.predict(
                    input=cur_prompt, stop=["\n" + followup, finalans]
                )

        # Force a final answer if the model has not produced one yet.
        if finalans not in ret_text:
            cur_prompt += finalans
            print(finalans, end="")
            ret_text = llm_chain.predict(input=cur_prompt, stop=["\n"])
            print(greenify(ret_text), end="")

        # NOTE(review): returns the full transcript plus the final
        # completion, not just the answer text -- callers parse it.
        return {self.output_key: cur_prompt + ret_text}

    def run(self, question: str) -> str:
        """More user-friendly interface for interfacing with self ask with search."""
        return self({self.input_key: question})[self.output_key]
|
@ -0,0 +1,44 @@
|
|||||||
|
# flake8: noqa
|
||||||
|
from langchain.prompt import Prompt
|
||||||
|
|
||||||
|
_DEFAULT_TEMPLATE = """Question: Who lived longer, Muhammad Ali or Alan Turing?
|
||||||
|
Are follow up questions needed here: Yes.
|
||||||
|
Follow up: How old was Muhammad Ali when he died?
|
||||||
|
Intermediate answer: Muhammad Ali was 74 years old when he died.
|
||||||
|
Follow up: How old was Alan Turing when he died?
|
||||||
|
Intermediate answer: Alan Turing was 41 years old when he died.
|
||||||
|
So the final answer is: Muhammad Ali
|
||||||
|
|
||||||
|
Question: When was the founder of craigslist born?
|
||||||
|
Are follow up questions needed here: Yes.
|
||||||
|
Follow up: Who was the founder of craigslist?
|
||||||
|
Intermediate answer: Craigslist was founded by Craig Newmark.
|
||||||
|
Follow up: When was Craig Newmark born?
|
||||||
|
Intermediate answer: Craig Newmark was born on December 6, 1952.
|
||||||
|
So the final answer is: December 6, 1952
|
||||||
|
|
||||||
|
Question: Who was the maternal grandfather of George Washington?
|
||||||
|
Are follow up questions needed here: Yes.
|
||||||
|
Follow up: Who was the mother of George Washington?
|
||||||
|
Intermediate answer: The mother of George Washington was Mary Ball Washington.
|
||||||
|
Follow up: Who was the father of Mary Ball Washington?
|
||||||
|
Intermediate answer: The father of Mary Ball Washington was Joseph Ball.
|
||||||
|
So the final answer is: Joseph Ball
|
||||||
|
|
||||||
|
Question: Are both the directors of Jaws and Casino Royale from the same country?
|
||||||
|
Are follow up questions needed here: Yes.
|
||||||
|
Follow up: Who is the director of Jaws?
|
||||||
|
Intermediate Answer: The director of Jaws is Steven Spielberg.
|
||||||
|
Follow up: Where is Steven Spielberg from?
|
||||||
|
Intermediate Answer: The United States.
|
||||||
|
Follow up: Who is the director of Casino Royale?
|
||||||
|
Intermediate Answer: The director of Casino Royale is Martin Campbell.
|
||||||
|
Follow up: Where is Martin Campbell from?
|
||||||
|
Intermediate Answer: New Zealand.
|
||||||
|
So the final answer is: No
|
||||||
|
|
||||||
|
Question: {input}"""
|
||||||
|
# Few-shot self-ask prompt: the worked examples in the template demonstrate
# the exact "Follow up:" / "Intermediate answer:" / "So the final answer is:"
# markers that SelfAskWithSearchChain parses out of completions.
PROMPT = Prompt(
    input_variables=["input"],
    template=_DEFAULT_TEMPLATE,
)
|
@ -0,0 +1,99 @@
|
|||||||
|
"""Chain that calls SerpAPI.
|
||||||
|
|
||||||
|
Heavily borrowed from https://github.com/ofirpress/self-ask
|
||||||
|
"""
|
||||||
|
import os
|
||||||
|
import sys
|
||||||
|
from typing import Any, Dict, List
|
||||||
|
|
||||||
|
from pydantic import BaseModel, Extra, root_validator
|
||||||
|
|
||||||
|
from langchain.chains.base import Chain
|
||||||
|
|
||||||
|
|
||||||
|
class HiddenPrints:
    """Context manager that silences ``print`` by redirecting stdout to devnull."""

    def __enter__(self) -> None:
        """Swap ``sys.stdout`` for a handle on the null device."""
        self._original_stdout = sys.stdout
        sys.stdout = open(os.devnull, "w")

    def __exit__(self, *_: Any) -> None:
        """Close the null-device handle and restore the original stdout."""
        devnull_handle = sys.stdout
        devnull_handle.close()
        sys.stdout = self._original_stdout
|
||||||
|
|
||||||
|
|
||||||
|
class SerpAPIChain(Chain, BaseModel):
    """Chain that calls SerpAPI.

    Requires the ``google-search-results`` package and the
    ``SERPAPI_API_KEY`` environment variable (checked by the validator).
    """

    # GoogleSearch class injected by validate_environment below.
    search_engine: Any
    input_key: str = "search_query"
    output_key: str = "search_result"

    class Config:
        """Configuration for this pydantic object."""

        extra = Extra.forbid

    @property
    def input_keys(self) -> List[str]:
        """Return the singular input key."""
        return [self.input_key]

    @property
    def output_keys(self) -> List[str]:
        """Return the singular output key."""
        return [self.output_key]

    @root_validator()
    def validate_environment(cls, values: Dict) -> Dict:
        """Validate that api key and python package exists in environment."""
        if "SERPAPI_API_KEY" not in os.environ:
            raise ValueError(
                "Did not find SerpAPI API key, please add an environment variable"
                " `SERPAPI_API_KEY` which contains it."
            )
        try:
            from serpapi import GoogleSearch

            values["search_engine"] = GoogleSearch
        except ImportError:
            # Fixed garbled message (was "Please it install it with").
            raise ValueError(
                "Could not import serpapi python package. "
                "Please install it with `pip install google-search-results`."
            )
        return values

    def _run(self, inputs: Dict[str, Any]) -> Dict[str, str]:
        """Query SerpAPI and pull the most direct answer from the response.

        Preference order: answer-box answer > answer-box snippet >
        highlighted words > first organic-result snippet; the output value
        is None when none of these are present.
        """
        params = {
            "api_key": os.environ["SERPAPI_API_KEY"],
            "engine": "google",
            "q": inputs[self.input_key],
            "google_domain": "google.com",
            "gl": "us",
            "hl": "en",
        }
        with HiddenPrints():
            search = self.search_engine(params)
            res = search.get_dict()

        answer_box = res.get("answer_box", {})
        organic_results = res.get("organic_results", [])
        if "answer" in answer_box:
            toret = answer_box["answer"]
        elif "snippet" in answer_box:
            toret = answer_box["snippet"]
        elif "snippet_highlighted_words" in answer_box:
            toret = answer_box["snippet_highlighted_words"][0]
        elif organic_results and "snippet" in organic_results[0]:
            # Previously raised KeyError/IndexError when SerpAPI returned
            # no organic results at all; now falls through to None.
            toret = organic_results[0]["snippet"]
        else:
            toret = None
        return {self.output_key: toret}

    def search(self, search_question: str) -> str:
        """More user-friendly interface for interfacing with search.

        NOTE(review): can actually return None when no answer is found,
        despite the ``str`` annotation -- callers check for None.
        """
        return self({self.input_key: search_question})[self.output_key]
|
@ -0,0 +1,32 @@
|
|||||||
|
"""Utilities for formatting strings."""
|
||||||
|
from string import Formatter
|
||||||
|
from typing import Any, Mapping, Sequence, Union
|
||||||
|
|
||||||
|
|
||||||
|
class StrictFormatter(Formatter):
    """A ``string.Formatter`` that rejects positional args and unused keys."""

    def check_unused_args(
        self,
        used_args: Sequence[Union[int, str]],
        args: Sequence,
        kwargs: Mapping[str, Any],
    ) -> None:
        """Raise ``KeyError`` if any keyword argument went unused."""
        unused = set(kwargs) - set(used_args)
        if unused:
            raise KeyError(unused)

    def vformat(
        self, format_string: str, args: Sequence, kwargs: Mapping[str, Any]
    ) -> str:
        """Format the string, refusing any positional arguments."""
        if args:
            raise ValueError(
                "No arguments should be provided, "
                "everything should be passed as keyword arguments."
            )
        return super().vformat(format_string, args, kwargs)


# Shared module-level instance used by the prompt machinery.
formatter = StrictFormatter()
|
@ -0,0 +1,5 @@
|
|||||||
|
"""Wrappers on top of large language models."""
|
||||||
|
from langchain.llms.cohere import Cohere
|
||||||
|
from langchain.llms.openai import OpenAI
|
||||||
|
|
||||||
|
__all__ = ["Cohere", "OpenAI"]
|
@ -0,0 +1,11 @@
|
|||||||
|
"""Base interface for large language models to expose."""
|
||||||
|
from abc import ABC, abstractmethod
|
||||||
|
from typing import List, Optional
|
||||||
|
|
||||||
|
|
||||||
|
class LLM(ABC):
    """Abstract interface for LLM wrappers: a callable from prompt to completion."""

    @abstractmethod
    def __call__(self, prompt: str, stop: Optional[List[str]] = None) -> str:
        """Generate a completion for ``prompt``, optionally halting at a stop sequence."""
|
@ -0,0 +1,72 @@
|
|||||||
|
"""Wrapper around Cohere APIs."""
|
||||||
|
import os
|
||||||
|
from typing import Any, Dict, List, Optional
|
||||||
|
|
||||||
|
from pydantic import BaseModel, Extra, root_validator
|
||||||
|
|
||||||
|
from langchain.llms.base import LLM
|
||||||
|
|
||||||
|
|
||||||
|
def remove_stop_tokens(text: str, stop: List[str]) -> str:
    """Strip the first stop sequence found at the end of ``text``, if any."""
    matching = (token for token in stop if text.endswith(token))
    token = next(matching, None)
    if token is None:
        return text
    return text[: -len(token)]
|
||||||
|
|
||||||
|
|
||||||
|
class Cohere(BaseModel, LLM):
    """Wrapper around Cohere large language models.

    Requires the ``cohere`` package and the ``COHERE_API_KEY`` environment
    variable (checked by the validator below).
    """

    # cohere.Client instance injected by the validator.
    client: Any
    # Generation parameters passed straight through to the Cohere API.
    model: str = "gptd-instruct-tft"
    max_tokens: int = 256
    temperature: float = 0.6
    k: int = 0
    p: int = 1
    frequency_penalty: int = 0
    presence_penalty: int = 0

    class Config:
        """Configuration for this pydantic object."""

        extra = Extra.forbid

    @root_validator()
    def template_is_valid(cls, values: Dict) -> Dict:
        """Validate that api key and python package exists in environment."""
        if "COHERE_API_KEY" not in os.environ:
            raise ValueError(
                "Did not find Cohere API key, please add an environment variable"
                " `COHERE_API_KEY` which contains it."
            )
        try:
            import cohere

            values["client"] = cohere.Client(os.environ["COHERE_API_KEY"])
        except ImportError:
            # Fixed garbled message (was "Please it install it with").
            raise ValueError(
                "Could not import cohere python package. "
                "Please install it with `pip install cohere`."
            )
        return values

    def __call__(self, prompt: str, stop: Optional[List[str]] = None) -> str:
        """Call out to Cohere's generate endpoint and return the first generation."""
        response = self.client.generate(
            model=self.model,
            prompt=prompt,
            max_tokens=self.max_tokens,
            temperature=self.temperature,
            k=self.k,
            p=self.p,
            frequency_penalty=self.frequency_penalty,
            presence_penalty=self.presence_penalty,
            stop_sequences=stop,
        )
        text = response.generations[0].text
        # If stop tokens are provided, Cohere's endpoint returns them.
        # In order to make this consistent with other endpoints, we strip them.
        if stop is not None:
            text = remove_stop_tokens(text, stop)
        return text
|
@ -0,0 +1,65 @@
|
|||||||
|
"""Wrapper around OpenAI APIs."""
|
||||||
|
import os
|
||||||
|
from typing import Any, Dict, List, Mapping, Optional
|
||||||
|
|
||||||
|
from pydantic import BaseModel, Extra, root_validator
|
||||||
|
|
||||||
|
from langchain.llms.base import LLM
|
||||||
|
|
||||||
|
|
||||||
|
class OpenAI(BaseModel, LLM):
    """Wrapper around OpenAI large language models.

    Requires the ``openai`` package and the ``OPENAI_API_KEY`` environment
    variable (checked by the validator below).
    """

    # openai.Completion class injected by the validator.
    client: Any
    # Completion parameters passed straight through to the OpenAI API.
    model_name: str = "text-davinci-002"
    temperature: float = 0.7
    max_tokens: int = 256
    top_p: int = 1
    frequency_penalty: int = 0
    presence_penalty: int = 0
    n: int = 1
    best_of: int = 1

    class Config:
        """Configuration for this pydantic object."""

        extra = Extra.forbid

    @root_validator()
    def validate_environment(cls, values: Dict) -> Dict:
        """Validate that api key and python package exists in environment."""
        if "OPENAI_API_KEY" not in os.environ:
            raise ValueError(
                "Did not find OpenAI API key, please add an environment variable"
                " `OPENAI_API_KEY` which contains it."
            )
        try:
            import openai

            values["client"] = openai.Completion
        except ImportError:
            # Fixed garbled message (was "Please it install it with").
            raise ValueError(
                "Could not import openai python package. "
                "Please install it with `pip install openai`."
            )
        return values

    @property
    def default_params(self) -> Mapping[str, Any]:
        """Get the default parameters for calling OpenAI API."""
        return {
            "temperature": self.temperature,
            "max_tokens": self.max_tokens,
            "top_p": self.top_p,
            "frequency_penalty": self.frequency_penalty,
            "presence_penalty": self.presence_penalty,
            "n": self.n,
            "best_of": self.best_of,
        }

    def __call__(self, prompt: str, stop: Optional[List[str]] = None) -> str:
        """Call out to OpenAI's create endpoint and return the first choice's text."""
        response = self.client.create(
            model=self.model_name, prompt=prompt, stop=stop, **self.default_params
        )
        return response["choices"][0]["text"]
|
@ -0,0 +1,47 @@
|
|||||||
|
"""Prompt schema definition."""
|
||||||
|
from typing import Any, Dict, List
|
||||||
|
|
||||||
|
from pydantic import BaseModel, Extra, root_validator
|
||||||
|
|
||||||
|
from langchain.formatting import formatter
|
||||||
|
|
||||||
|
_FORMATTER_MAPPING = {
|
||||||
|
"f-string": formatter.format,
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
class Prompt(BaseModel):
    """Schema to represent a prompt for an LLM."""

    # Names of the variables the template expects.
    input_variables: List[str]
    # The template text itself.
    template: str
    # Formatting language used; must be a key of _FORMATTER_MAPPING.
    template_format: str = "f-string"

    class Config:
        """Configuration for this pydantic object."""

        extra = Extra.forbid

    def format(self, **kwargs: Any) -> str:
        """Format the prompt with the inputs."""
        return _FORMATTER_MAPPING[self.template_format](self.template, **kwargs)

    @root_validator()
    def template_is_valid(cls, values: Dict) -> Dict:
        """Check that template and input variables are consistent."""
        input_variables = values["input_variables"]
        template = values["template"]
        template_format = values["template_format"]
        if template_format not in _FORMATTER_MAPPING:
            valid_formats = list(_FORMATTER_MAPPING)
            raise ValueError(
                f"Invalid template format. Got `{template_format}`;"
                f" should be one of {valid_formats}"
            )
        # Dry-run the formatter with dummy values: a missing variable
        # raises KeyError from format(); an extra one is rejected by
        # StrictFormatter.check_unused_args (also KeyError).
        dummy_inputs = {input_variable: "foo" for input_variable in input_variables}
        try:
            formatter_func = _FORMATTER_MAPPING[template_format]
            formatter_func(template, **dummy_inputs)
        except KeyError:
            raise ValueError("Invalid prompt schema.")
        return values
|
@ -0,0 +1,7 @@
|
|||||||
|
[tool.isort]
|
||||||
|
profile = "black"
|
||||||
|
|
||||||
|
[tool.mypy]
|
||||||
|
ignore_missing_imports = "True"
|
||||||
|
disallow_untyped_defs = "True"
|
||||||
|
exclude = ["notebooks"]
|
@ -0,0 +1,10 @@
|
|||||||
|
version: 2
|
||||||
|
sphinx:
|
||||||
|
configuration: docs/conf.py
|
||||||
|
formats: all
|
||||||
|
python:
|
||||||
|
version: 3.6
|
||||||
|
install:
|
||||||
|
- requirements: docs/requirements.txt
|
||||||
|
- method: pip
|
||||||
|
path: .
|
@ -0,0 +1,9 @@
|
|||||||
|
-r test_requirements.txt
|
||||||
|
black
|
||||||
|
isort
|
||||||
|
mypy
|
||||||
|
flake8
|
||||||
|
flake8-docstrings
|
||||||
|
cohere
|
||||||
|
openai
|
||||||
|
google-search-results
|
@ -0,0 +1,23 @@
|
|||||||
|
"""Set up the package."""
|
||||||
|
from pathlib import Path
|
||||||
|
|
||||||
|
from setuptools import find_packages, setup
|
||||||
|
|
||||||
|
with open(Path(__file__).absolute().parents[0] / "langchain" / "VERSION") as _f:
|
||||||
|
__version__ = _f.read().strip()
|
||||||
|
|
||||||
|
with open("README.md", "r") as f:
|
||||||
|
long_description = f.read()
|
||||||
|
|
||||||
|
setup(
|
||||||
|
name="langchain",
|
||||||
|
version=__version__,
|
||||||
|
packages=find_packages(),
|
||||||
|
description="Building applications with LLMs through composability",
|
||||||
|
install_requires=["pydantic"],
|
||||||
|
long_description=long_description,
|
||||||
|
license="MIT",
|
||||||
|
url="https://github.com/hwchase17/langchain",
|
||||||
|
include_package_data=True,
|
||||||
|
long_description_content_type="text/markdown",
|
||||||
|
)
|
@ -0,0 +1,3 @@
|
|||||||
|
-e .
|
||||||
|
pytest
|
||||||
|
pytest-dotenv
|
@ -0,0 +1 @@
|
|||||||
|
"""All tests for this package."""
|
@ -0,0 +1 @@
|
|||||||
|
"""All integration tests (tests that call out to an external API)."""
|
@ -0,0 +1 @@
|
|||||||
|
"""All integration tests for chains."""
|
@ -0,0 +1,18 @@
|
|||||||
|
"""Integration test for self ask with search."""
|
||||||
|
from langchain.chains.self_ask_with_search.base import SelfAskWithSearchChain
|
||||||
|
from langchain.chains.serpapi import SerpAPIChain
|
||||||
|
from langchain.llms.openai import OpenAI
|
||||||
|
|
||||||
|
|
||||||
|
def test_self_ask_with_search() -> None:
|
||||||
|
"""Test functionality on a prompt."""
|
||||||
|
question = "What is the hometown of the reigning men's U.S. Open champion?"
|
||||||
|
chain = SelfAskWithSearchChain(
|
||||||
|
llm=OpenAI(temperature=0),
|
||||||
|
search_chain=SerpAPIChain(),
|
||||||
|
input_key="q",
|
||||||
|
output_key="a",
|
||||||
|
)
|
||||||
|
answer = chain.run(question)
|
||||||
|
final_answer = answer.split("\n")[-1]
|
||||||
|
assert final_answer == "So the final answer is: El Palmar, Murcia, Spain"
|
@ -0,0 +1,9 @@
|
|||||||
|
"""Integration test for SerpAPI."""
|
||||||
|
from langchain.chains.serpapi import SerpAPIChain
|
||||||
|
|
||||||
|
|
||||||
|
def test_call() -> None:
|
||||||
|
"""Test that call gives the correct answer."""
|
||||||
|
chain = SerpAPIChain()
|
||||||
|
output = chain.search("What was Obama's first name?")
|
||||||
|
assert output == "Barack Hussein Obama II"
|
@ -0,0 +1 @@
|
|||||||
|
"""All integration tests for LLM objects."""
|
@ -0,0 +1,10 @@
|
|||||||
|
"""Test Cohere API wrapper."""
|
||||||
|
|
||||||
|
from langchain.llms.cohere import Cohere
|
||||||
|
|
||||||
|
|
||||||
|
def test_cohere_call() -> None:
|
||||||
|
"""Test valid call to cohere."""
|
||||||
|
llm = Cohere(max_tokens=10)
|
||||||
|
output = llm("Say foo:")
|
||||||
|
assert isinstance(output, str)
|
@ -0,0 +1,10 @@
|
|||||||
|
"""Test OpenAI API wrapper."""
|
||||||
|
|
||||||
|
from langchain.llms.openai import OpenAI
|
||||||
|
|
||||||
|
|
||||||
|
def test_openai_call() -> None:
    """Test valid call to openai."""
    # Renamed from test_cohere_call: the name and docstring were
    # copy-pasted from the Cohere test module.
    llm = OpenAI(max_tokens=10)
    output = llm("Say foo:")
    assert isinstance(output, str)
|
@ -0,0 +1 @@
|
|||||||
|
"""All unit tests (lightweight tests)."""
|
@ -0,0 +1 @@
|
|||||||
|
"""Tests for correct functioning of chains."""
|
@ -0,0 +1,50 @@
|
|||||||
|
"""Test logic on base chain class."""
|
||||||
|
from typing import Dict, List
|
||||||
|
|
||||||
|
import pytest
|
||||||
|
from pydantic import BaseModel
|
||||||
|
|
||||||
|
from langchain.chains.base import Chain
|
||||||
|
|
||||||
|
|
||||||
|
class FakeChain(Chain, BaseModel):
|
||||||
|
"""Fake chain class for testing purposes."""
|
||||||
|
|
||||||
|
be_correct: bool = True
|
||||||
|
|
||||||
|
@property
|
||||||
|
def input_keys(self) -> List[str]:
|
||||||
|
"""Input key of foo."""
|
||||||
|
return ["foo"]
|
||||||
|
|
||||||
|
@property
|
||||||
|
def output_keys(self) -> List[str]:
|
||||||
|
"""Output key of bar."""
|
||||||
|
return ["bar"]
|
||||||
|
|
||||||
|
def _run(self, inputs: Dict[str, str]) -> Dict[str, str]:
|
||||||
|
if self.be_correct:
|
||||||
|
return {"bar": "baz"}
|
||||||
|
else:
|
||||||
|
return {"baz": "bar"}
|
||||||
|
|
||||||
|
|
||||||
|
def test_bad_inputs() -> None:
|
||||||
|
"""Test errors are raised if input keys are not found."""
|
||||||
|
chain = FakeChain()
|
||||||
|
with pytest.raises(ValueError):
|
||||||
|
chain({"foobar": "baz"})
|
||||||
|
|
||||||
|
|
||||||
|
def test_bad_outputs() -> None:
|
||||||
|
"""Test errors are raised if outputs keys are not found."""
|
||||||
|
chain = FakeChain(be_correct=False)
|
||||||
|
with pytest.raises(ValueError):
|
||||||
|
chain({"foo": "baz"})
|
||||||
|
|
||||||
|
|
||||||
|
def test_correct_call() -> None:
|
||||||
|
"""Test correct call of fake chain."""
|
||||||
|
chain = FakeChain()
|
||||||
|
output = chain({"foo": "bar"})
|
||||||
|
assert output == {"foo": "bar", "bar": "baz"}
|
@ -0,0 +1,36 @@
|
|||||||
|
"""Test LLM chain."""
|
||||||
|
import pytest
|
||||||
|
|
||||||
|
from langchain.chains.llm import LLMChain
|
||||||
|
from langchain.prompt import Prompt
|
||||||
|
from tests.unit_tests.llms.fake_llm import FakeLLM
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.fixture
|
||||||
|
def fake_llm_chain() -> LLMChain:
|
||||||
|
"""Fake LLM chain for testing purposes."""
|
||||||
|
prompt = Prompt(input_variables=["bar"], template="This is a {bar}:")
|
||||||
|
return LLMChain(prompt=prompt, llm=FakeLLM(), output_key="text1")
|
||||||
|
|
||||||
|
|
||||||
|
def test_missing_inputs(fake_llm_chain: LLMChain) -> None:
|
||||||
|
"""Test error is raised if inputs are missing."""
|
||||||
|
with pytest.raises(ValueError):
|
||||||
|
fake_llm_chain({"foo": "bar"})
|
||||||
|
|
||||||
|
|
||||||
|
def test_valid_call(fake_llm_chain: LLMChain) -> None:
|
||||||
|
"""Test valid call of LLM chain."""
|
||||||
|
output = fake_llm_chain({"bar": "baz"})
|
||||||
|
assert output == {"bar": "baz", "text1": "foo"}
|
||||||
|
|
||||||
|
# Test with stop words.
|
||||||
|
output = fake_llm_chain({"bar": "baz", "stop": ["foo"]})
|
||||||
|
# Response should be `bar` now.
|
||||||
|
assert output == {"bar": "baz", "stop": ["foo"], "text1": "bar"}
|
||||||
|
|
||||||
|
|
||||||
|
def test_predict_method(fake_llm_chain: LLMChain) -> None:
|
||||||
|
"""Test predict method works."""
|
||||||
|
output = fake_llm_chain.predict(bar="baz")
|
||||||
|
assert output == "foo"
|
@ -0,0 +1,40 @@
|
|||||||
|
"""Test LLM Math functionality."""
|
||||||
|
|
||||||
|
import pytest
|
||||||
|
|
||||||
|
from langchain.chains.llm_math.base import LLMMathChain
|
||||||
|
from langchain.chains.llm_math.prompt import _PROMPT_TEMPLATE
|
||||||
|
from tests.unit_tests.llms.fake_llm import FakeLLM
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.fixture
|
||||||
|
def fake_llm_math_chain() -> LLMMathChain:
|
||||||
|
"""Fake LLM Math chain for testing."""
|
||||||
|
complex_question = _PROMPT_TEMPLATE.format(question="What is the square root of 2?")
|
||||||
|
queries = {
|
||||||
|
_PROMPT_TEMPLATE.format(question="What is 1 plus 1?"): "Answer: 2",
|
||||||
|
complex_question: "```python\nprint(2**.5)\n```",
|
||||||
|
_PROMPT_TEMPLATE.format(question="foo"): "foo",
|
||||||
|
}
|
||||||
|
fake_llm = FakeLLM(queries=queries)
|
||||||
|
return LLMMathChain(llm=fake_llm, input_key="q", output_key="a")
|
||||||
|
|
||||||
|
|
||||||
|
def test_simple_question(fake_llm_math_chain: LLMMathChain) -> None:
|
||||||
|
"""Test simple question that should not need python."""
|
||||||
|
question = "What is 1 plus 1?"
|
||||||
|
output = fake_llm_math_chain.run(question)
|
||||||
|
assert output == "Answer: 2"
|
||||||
|
|
||||||
|
|
||||||
|
def test_complex_question(fake_llm_math_chain: LLMMathChain) -> None:
|
||||||
|
"""Test complex question that should need python."""
|
||||||
|
question = "What is the square root of 2?"
|
||||||
|
output = fake_llm_math_chain.run(question)
|
||||||
|
assert output == f"Answer: {2**.5}\n"
|
||||||
|
|
||||||
|
|
||||||
|
def test_error(fake_llm_math_chain: LLMMathChain) -> None:
|
||||||
|
"""Test question that raises error."""
|
||||||
|
with pytest.raises(ValueError):
|
||||||
|
fake_llm_math_chain.run("foo")
|
@ -0,0 +1,15 @@
|
|||||||
|
"""Test python chain."""
|
||||||
|
|
||||||
|
from langchain.chains.python import PythonChain
|
||||||
|
|
||||||
|
|
||||||
|
def test_functionality() -> None:
|
||||||
|
"""Test correct functionality."""
|
||||||
|
chain = PythonChain(input_key="code1", output_key="output1")
|
||||||
|
code = "print(1 + 1)"
|
||||||
|
output = chain({"code1": code})
|
||||||
|
assert output == {"code1": code, "output1": "2\n"}
|
||||||
|
|
||||||
|
# Test with the more user-friendly interface.
|
||||||
|
simple_output = chain.run(code)
|
||||||
|
assert simple_output == "2\n"
|
@ -0,0 +1,5 @@
|
|||||||
|
{
|
||||||
|
"input_variables": ["foo"],
|
||||||
|
"template": "This is a {foo} test.",
|
||||||
|
"bad_var": 1
|
||||||
|
}
|
@ -0,0 +1,3 @@
|
|||||||
|
{
|
||||||
|
"input_variables": ["foo"]
|
||||||
|
}
|
@ -0,0 +1,4 @@
|
|||||||
|
{
|
||||||
|
"input_variables": ["foo"],
|
||||||
|
"template": "This is a {foo} test."
|
||||||
|
}
|
@ -0,0 +1 @@
|
|||||||
|
"""All unit tests for LLM objects."""
|
@ -0,0 +1,21 @@
|
|||||||
|
"""Fake LLM wrapper for testing purposes."""
|
||||||
|
from typing import List, Mapping, Optional
|
||||||
|
|
||||||
|
from langchain.llms.base import LLM
|
||||||
|
|
||||||
|
|
||||||
|
class FakeLLM(LLM):
    """Fake LLM wrapper for testing purposes."""

    def __init__(self, queries: Optional[Mapping] = None):
        """Optionally seed a prompt -> response lookup table."""
        self._queries = queries

    def __call__(self, prompt: str, stop: Optional[List[str]] = None) -> str:
        """Return the canned answer for ``prompt``; else "foo"/"bar" by stop words."""
        if self._queries is not None:
            return self._queries[prompt]
        return "foo" if stop is None else "bar"
|
@ -0,0 +1,17 @@
|
|||||||
|
"""Test helper functions for Cohere API."""
|
||||||
|
|
||||||
|
from langchain.llms.cohere import remove_stop_tokens
|
||||||
|
|
||||||
|
|
||||||
|
def test_remove_stop_tokens() -> None:
|
||||||
|
"""Test removing stop tokens when they occur."""
|
||||||
|
text = "foo bar baz"
|
||||||
|
output = remove_stop_tokens(text, ["moo", "baz"])
|
||||||
|
assert output == "foo bar "
|
||||||
|
|
||||||
|
|
||||||
|
def test_remove_stop_tokens_none() -> None:
|
||||||
|
"""Test removing stop tokens when they do not occur."""
|
||||||
|
text = "foo bar baz"
|
||||||
|
output = remove_stop_tokens(text, ["moo"])
|
||||||
|
assert output == "foo bar baz"
|
@ -0,0 +1,26 @@
|
|||||||
|
"""Test formatting functionality."""
|
||||||
|
import pytest
|
||||||
|
|
||||||
|
from langchain.formatting import formatter
|
||||||
|
|
||||||
|
|
||||||
|
def test_valid_formatting() -> None:
|
||||||
|
"""Test formatting works as expected."""
|
||||||
|
template = "This is a {foo} test."
|
||||||
|
output = formatter.format(template, foo="good")
|
||||||
|
expected_output = "This is a good test."
|
||||||
|
assert output == expected_output
|
||||||
|
|
||||||
|
|
||||||
|
def test_does_not_allow_args() -> None:
|
||||||
|
"""Test formatting raises error when args are provided."""
|
||||||
|
template = "This is a {} test."
|
||||||
|
with pytest.raises(ValueError):
|
||||||
|
formatter.format(template, "good")
|
||||||
|
|
||||||
|
|
||||||
|
def test_does_not_allow_extra_kwargs() -> None:
|
||||||
|
"""Test formatting does not allow extra key word arguments."""
|
||||||
|
template = "This is a {foo} test."
|
||||||
|
with pytest.raises(KeyError):
|
||||||
|
formatter.format(template, foo="good", bar="oops")
|
@ -0,0 +1,47 @@
|
|||||||
|
"""Test functionality related to prompts."""
|
||||||
|
import pytest
|
||||||
|
|
||||||
|
from langchain.prompt import Prompt
|
||||||
|
|
||||||
|
|
||||||
|
def test_prompt_valid() -> None:
|
||||||
|
"""Test prompts can be constructed."""
|
||||||
|
template = "This is a {foo} test."
|
||||||
|
input_variables = ["foo"]
|
||||||
|
prompt = Prompt(input_variables=input_variables, template=template)
|
||||||
|
assert prompt.template == template
|
||||||
|
assert prompt.input_variables == input_variables
|
||||||
|
|
||||||
|
|
||||||
|
def test_prompt_missing_input_variables() -> None:
|
||||||
|
"""Test error is raised when input variables are not provided."""
|
||||||
|
template = "This is a {foo} test."
|
||||||
|
input_variables: list = []
|
||||||
|
with pytest.raises(ValueError):
|
||||||
|
Prompt(input_variables=input_variables, template=template)
|
||||||
|
|
||||||
|
|
||||||
|
def test_prompt_extra_input_variables() -> None:
|
||||||
|
"""Test error is raised when there are too many input variables."""
|
||||||
|
template = "This is a {foo} test."
|
||||||
|
input_variables = ["foo", "bar"]
|
||||||
|
with pytest.raises(ValueError):
|
||||||
|
Prompt(input_variables=input_variables, template=template)
|
||||||
|
|
||||||
|
|
||||||
|
def test_prompt_wrong_input_variables() -> None:
|
||||||
|
"""Test error is raised when name of input variable is wrong."""
|
||||||
|
template = "This is a {foo} test."
|
||||||
|
input_variables = ["bar"]
|
||||||
|
with pytest.raises(ValueError):
|
||||||
|
Prompt(input_variables=input_variables, template=template)
|
||||||
|
|
||||||
|
|
||||||
|
def test_prompt_invalid_template_format() -> None:
|
||||||
|
"""Test initializing a prompt with invalid template format."""
|
||||||
|
template = "This is a {foo} test."
|
||||||
|
input_variables = ["foo"]
|
||||||
|
with pytest.raises(ValueError):
|
||||||
|
Prompt(
|
||||||
|
input_variables=input_variables, template=template, template_format="bar"
|
||||||
|
)
|
Loading…
Reference in New Issue