First main commit

2024-10-31 15:20:26 +00:00 · 2022-05-24 00:29:17 -07:00 · 2022-05-24 00:29:17 -07:00 · ed301be2a7
commit ed301be2a7
parent 6ada1f2d2c
31 changed files with 2863 additions and 0 deletions
--- a/.flake8
+++ b/.flake8
@ -0,0 +1,10 @@
+# This is our code-style check. We currently allow the following exceptions:
+#   - E731: do not assign a lambda expression, use a def
+#   - E402: module level import not at top of file
+#   - W503: line break before binary operator
+
+[flake8]
+exclude = .git
+max-line-length = 88
+ignore = E731, E402, W503
+per-file-ignores = __init__.py:F401
--- a/.github/ISSUE_TEMPLATE/bug_report.md
+++ b/.github/ISSUE_TEMPLATE/bug_report.md
@ -0,0 +1,28 @@
+---
+name: Bug report
+about: Create a report to help us improve
+
+---
+
+## Description of the bug
+A clear and concise description of what the bug is.
+
+## To Reproduce
+Steps to reproduce the behavior:
+1. Go to '...'
+2. Click on '....'
+3. Execute the code '...'
+If necessary, attach example data which can be used to replicate the issue.
+
+## Expected behavior
+A clear and concise description of what you expected to happen.
+
+## Error Logs/Screenshots
+If applicable, add error logs or screenshots to help explain your problem.
+
+## Environment (please complete the following information)
+ - OS: [e.g. Ubuntu 18.04]
+ - bootleg Version: [e.g. 0.6.0]
+
+## Additional context
+Add any other context about the problem here.
--- a/.github/ISSUE_TEMPLATE/feature_request.md
+++ b/.github/ISSUE_TEMPLATE/feature_request.md
@ -0,0 +1,19 @@
+---
+name: Feature request
+about: Suggest an idea for this project
+
+---
+
+## Description of the feature request
+
+**Is your feature request related to a problem? Please describe.**
+A clear and concise description of what the problem is. Ex. I'm always frustrated when [...]
+
+## Description of the solution you'd like
+A clear and concise description of what you want to happen.
+
+## Description of the alternatives you've considered
+A clear and concise description of any alternative solutions or features you've considered.
+
+## Additional context
+Add any other context or screenshots about the feature request here.
--- a/.github/workflows/ci.yaml
+++ b/.github/workflows/ci.yaml
@ -0,0 +1,65 @@
+name: CI
+
+on:
+    push:
+        branches:
+            - main
+    pull_request:
+        branches:
+            - main
+
+    # Allows you to run this workflow manually from the Actions tab
+    workflow_dispatch:
+
+jobs:
+    test:
+        runs-on: ${{ matrix.os }}
+        timeout-minutes: 30
+        strategy:
+            matrix:
+                os: [ubuntu-latest]
+                python-version: ["3.8", "3.9", "3.10"]
+        services:
+            # Label used to access the service container
+            redis:
+                # Docker Hub image
+                image: redislabs/redis
+                    # Set health checks to wait until redis has started
+                options: >-
+                    --health-cmd "redis-cli ping"
+                    --health-interval 10s
+                    --health-timeout 5s
+                    --health-retries 5
+                ports:
+                    # Maps port 6379 on service container to the host
+                    - 6379:6379
+        steps:
+            - uses: actions/checkout@v3
+            - uses: actions/setup-python@v3
+              with:
+                  python-version: ${{ matrix.python-version }}
+            - name: Install Poetry
+              uses: snok/install-poetry@v1
+              with:
+                  virtualenvs-in-project: true
+                  virtualenvs-create: true
+                  installer-parallel: true
+            - name: Load cached venv if cache exists
+              id: cached-poetry-deps
+              uses: actions/cache@v3
+              with:
+                  path: .venv
+                  key: venv-${{ runner.os }}-${{ matrix.python-version }}-${{ hashFiles('**/poetry.lock') }}
+            - name: Install dependencies
+              if: steps.cached-poetry-deps.outputs.cache-hit != 'true'
+              run: |
+                  poetry install --no-interaction --no-root
+            - name: Install Manifest
+              run: |
+                  make dev
+            - name: Run preliminary checks
+              run: |
+                  make check
+            - name: Test with pytest
+              run: |
+                  poetry run pytest tests
--- a/.gitignore
+++ b/.gitignore
@ -0,0 +1,120 @@
+runs/*
+
+*._*
+# Pickle Saved
+*.pt
+*.pk
+**/*.pt
+**/*.pk
+
+# PyCharm
+*.idea
+
+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[cod]
+*$py.class
+
+# C extensions
+*.so
+
+# Distribution / packaging
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+MANIFEST
+
+# PyInstaller
+#  Usually these files are written by a python script from a template
+#  before PyInstaller builds the exe, so as to inject date/other infos into it.
+*.manifest
+*.spec
+
+# Installer logs
+pip-log.txt
+pip-delete-this-directory.txt
+
+# Unit test / coverage reports
+htmlcov/
+.tox/
+.coverage
+.coverage.*
+.cache
+nosetests.xml
+coverage.xml
+*.cover
+.hypothesis/
+.pytest_cache/
+
+# Translations
+*.mo
+*.pot
+
+# Django stuff:
+*.log
+local_settings.py
+db.sqlite3
+
+# Flask stuff:
+instance/
+.webassets-cache
+
+# Scrapy stuff:
+.scrapy
+
+# Sphinx documentation
+docs/_build/
+
+# PyBuilder
+target/
+
+# Jupyter Notebook
+.ipynb_checkpoints
+
+# pyenv
+.python-version
+
+# celery beat schedule file
+celerybeat-schedule
+
+# SageMath parsed files
+*.sage.py
+
+# Environments
+.env
+.venv
+env/
+venv/
+ENV/
+env.bak/
+venv.bak/
+
+# Spyder project settings
+.spyderproject
+.spyproject
+
+# Rope project settings
+.ropeproject
+
+# mkdocs documentation
+/site
+
+# mypy
+.mypy_cache/
+
+*.tsv
+*.7z
+.DS_Store
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@ -0,0 +1,23 @@
+repos:
+    - repo: https://github.com/pre-commit/pre-commit-hooks
+      rev: v3.2.0
+      hooks:
+          - id: trailing-whitespace
+          - id: end-of-file-fixer
+          - id: check-yaml
+          - id: check-toml
+          - id: check-merge-conflict
+          - id: check-added-large-files
+    - repo: https://github.com/timothycrosley/isort
+      rev: 5.9.3
+      hooks:
+          - id: isort
+    - repo: https://github.com/psf/black
+      rev: 22.3.0
+      hooks:
+          - id: black
+            language_version: python3
+    - repo: https://gitlab.com/pycqa/flake8
+      rev: 3.9.2
+      hooks:
+          - id: flake8
--- a/28
+++ b/28
@ -0,0 +1,28 @@
+dev:
+	poetry install
+	poetry run pre-commit install
+
+test: dev check
+	poetry install
+	poetry run pytest tests
+
+format:
+	isort --atomic manifest/ tests/
+	black manifest/ tests/
+
+check:
+	isort -c manifest/ tests/
+	black manifest/ tests/ --check
+	flake8 manifest/ tests/
+	mypy manifest/
+
+clean:
+	pip uninstall -y manifest
+	rm -rf src/manifest.egg-info
+	rm -rf build/ dist/
+
+prune:
+	@bash -c "git fetch -p";
+	@bash -c "for branch in $(git branch -vv | grep ': gone]' | awk '{print $1}'); do git branch -d $branch; done";
+
+.PHONY: dev test clean check prune
--- a/README.md
+++ b/README.md
@ -1,2 +1,21 @@
 # manifest
 Prompt programming with FMs.
+
+# Install
+Download the code:
+```
+git clone git@github.com:HazyResearch/manifest.git
+cd manifest
+```
+
+Install:
+```
+pip install poetry
+poetry install
+poetry run pre-commit install
+```
+or
+```
+pip install poetry
+make dev
+```
--- a/manifest/init.py
+++ b/manifest/init.py
@ -0,0 +1,3 @@
+"""Manifest init."""
+from manifest.manifest import Manifest
+from manifest.prompt import Prompt
--- a/manifest/api/app.py
+++ b/manifest/api/app.py
@ -0,0 +1 @@
+"""Flask app."""
--- a/manifest/api/models/huggingface_model.py
+++ b/manifest/api/models/huggingface_model.py
@ -0,0 +1 @@
+"""Huggingface model."""
--- a/manifest/api/models/model.py
+++ b/manifest/api/models/model.py
@ -0,0 +1 @@
+"""Model class."""
--- a/manifest/caches/init.py
+++ b/manifest/caches/init.py
@ -0,0 +1,2 @@
+"""Cache init."""
+from manifest.caches.cache import Cache
--- a/manifest/caches/cache.py
+++ b/manifest/caches/cache.py
@ -0,0 +1,113 @@
+"""Cache for queries and responses."""
+import json
+from abc import ABC, abstractmethod
+from typing import Any, Callable, Dict, Tuple, Union
+
+from manifest.clients.response import Response
+
+
+def request_to_key(request: Dict) -> str:
+    """
+    Normalize a request into a key.
+
+    Args:
+        request: request to normalize.
+
+    Returns:
+        normalized key.
+    """
+    return json.dumps(request, sort_keys=True)
+
+
+def key_to_request(key: str) -> Dict:
+    """
+    Convert the normalized version to the request.
+
+    Args:
+        key: normalized key to convert.
+
+    Returns:
+        unnormalized request dict.
+    """
+    return json.loads(key)
+
+
+class Cache(ABC):
+    """A cache for request/response pairs."""
+
+    def __init__(self, connection_str: str, **kwargs: Any):
+        """
+        Initialize client.
+
+        kwargs are passed to client as default parameters.
+
+        For clients like OpenAI that do not require a connection,
+        the connection_str can be None.
+
+        Args:
+            connection_str: connection string for client.
+        """
+        self.connect(connection_str, **kwargs)
+
+    @abstractmethod
+    def close(self) -> None:
+        """Close the client."""
+        raise NotImplementedError()
+
+    @abstractmethod
+    def connect(self, connection_str: str, **kwargs: Any) -> None:
+        """
+        Connect to client.
+
+        Args:
+            connection_str: connection string.
+        """
+        raise NotImplementedError()
+
+    @abstractmethod
+    def get_key(self, key: str, table: str = "default") -> Union[str, None]:
+        """
+        Get the key for a request.
+
+        With return None if key is not in cache.
+
+        Args:
+            key: key for cache.
+            table: table to get key in.
+        """
+        raise NotImplementedError()
+
+    @abstractmethod
+    def set_key(self, key: str, value: str, table: str = "default") -> None:
+        """
+        Set the value for the key.
+
+        Will override old value.
+
+        Args:
+            key: key for cache.
+            value: new value for key.
+            table: table to set key in.
+        """
+        raise NotImplementedError()
+
+    @abstractmethod
+    def commit(self) -> None:
+        """Commit any results."""
+        raise NotImplementedError()
+
+    def get(
+        self, request: Dict, overwrite_cache: bool, compute: Callable[[], Response]
+    ) -> Tuple[Response, bool]:
+        """Get the result of request (by calling compute as needed)."""
+        key = request_to_key(request)
+        cached_response = self.get_key(key)
+        if cached_response and not overwrite_cache:
+            cached = True
+            response = Response.deserialize(cached_response)
+        else:
+            # Type Response
+            response = compute()
+            self.set_key(key, response.serialize())
+            cached = False
+        return response, cached
--- a/manifest/caches/redis.py
+++ b/manifest/caches/redis.py
@ -0,0 +1,52 @@
+"""Redis cache."""
+from typing import Any, Union
+
+import redis
+
+from manifest.caches import Cache
+
+
+class RedisCache(Cache):
+    """A Redis cache for request/response pairs."""
+
+    def connect(self, connection_str: str, **kwargs: Any) -> None:
+        """
+        Connect to client.
+
+        Args:
+            connection_str: connection string.
+        """
+        host, port = connection_str.split(":")
+        self.redis = redis.Redis(host=host, port=int(port))
+        return
+
+    def close(self) -> None:
+        """Close the client."""
+        self.redis.close()
+
+    def get_key(self, key: str, table: str = "default") -> Union[str, None]:
+        """
+        Get the key for a request.
+
+        With return None if key is not in cache.
+
+        Args:
+            key: key for cache.
+        """
+        pass
+
+    def set_key(self, key: str, value: str, table: str = "default") -> None:
+        """
+        Set the value for the key.
+
+        Will override old value.
+
+        Args:
+            key: key for cache.
+            value: new value for key.
+        """
+        self.redis[key] = value
+
+    def commit(self) -> None:
+        """Commit any results."""
+        pass
--- a/manifest/caches/sqlite.py
+++ b/manifest/caches/sqlite.py
@ -0,0 +1,79 @@
+"""SQLite cache."""
+import logging
+from pathlib import Path
+from typing import Any, Union
+
+from sqlitedict import SqliteDict
+
+from manifest.caches import Cache
+
+logging.getLogger("sqlitedict").setLevel(logging.WARNING)
+
+
+class SQLiteCache(Cache):
+    """A SQLite cache for request/response pairs."""
+
+    def connect(self, connection_str: str, **kwargs: Any) -> None:
+        """
+        Connect to client.
+
+        Args:
+            connection_str: connection string.
+        """
+        self.cache_dir = connection_str
+        Path(self.cache_dir).mkdir(parents=True, exist_ok=True)
+        # If more than two tables, switch to full on SQL connection
+        self.query_file = Path(self.cache_dir, "query.sqlite")
+        self.prompt_file = Path(self.cache_dir, "prompts.sqlite")
+        self.cache = SqliteDict(self.query_file, autocommit=False)
+        self.prompt_cache = SqliteDict(self.prompt_file, autocommit=False)
+        return
+
+    def close(self) -> None:
+        """Close the client."""
+        self.cache.close()
+
+    def get_key(self, key: str, table: str = "default") -> Union[str, None]:
+        """
+        Get the key for a request.
+
+        With return None if key is not in cache.
+
+        Args:
+            key: key for cache.
+            table: table to get key in.
+        """
+        if table == "prompt":
+            return self.prompt_cache.get(key)
+        else:
+            if table != "default":
+                raise ValueError(
+                    "SQLiteDict only support table of `default` or `prompt`"
+                )
+        return self.cache.get(key)
+
+    def set_key(self, key: str, value: str, table: str = "default") -> None:
+        """
+        Set the value for the key.
+
+        Will override old value.
+
+        Args:
+            key: key for cache.
+            value: new value for key.
+            table: table to set key in.
+        """
+        if table == "prompt":
+            self.prompt_cache[key] = value
+        else:
+            if table != "default":
+                raise ValueError(
+                    "SQLiteDict only support table of `default` or `prompt`"
+                )
+            self.cache[key] = value
+        self.commit()
+
+    def commit(self) -> None:
+        """Commit any results."""
+        self.prompt_cache.commit()
+        self.cache.commit()
--- a/manifest/clients/init.py
+++ b/manifest/clients/init.py
@ -0,0 +1,3 @@
+"""Client init."""
+from manifest.clients.client import Client
+from manifest.clients.response import Response
--- a/manifest/clients/client.py
+++ b/manifest/clients/client.py
@ -0,0 +1,58 @@
+"""Client class."""
+from abc import ABC, abstractmethod
+from typing import Any, Callable, Dict, Optional, Tuple
+
+from manifest.clients import Response
+
+
+class Client(ABC):
+    """Client class."""
+
+    def __init__(self, connection_str: Optional[str] = None, **kwargs: Any):
+        """
+        Initialize client.
+
+        kwargs are passed to client as default parameters.
+
+        For clients like OpenAI that do not require a connection,
+        the connection_str can be None.
+
+        Args:
+            connection_str: connection string for client.
+        """
+        self.connect(connection_str, **kwargs)
+
+    @abstractmethod
+    def close(self) -> None:
+        """Close the client."""
+        raise NotImplementedError()
+
+    @abstractmethod
+    def connect(self, connection_str: str, **kwargs: Any) -> None:
+        """
+        Connect to client.
+
+        Args:
+            connection_str: connection string.
+        """
+        raise NotImplementedError()
+
+    @abstractmethod
+    def get_request(
+        self, query: str, **kwargs: Any
+    ) -> Tuple[Callable[[], Response], Dict]:
+        """
+        Get request function.
+
+        kwargs override default parameters.
+
+        Calling the returned function will run the request.
+
+        Args:
+            query: query string.
+
+        Returns:
+            request function that takes no input.
+            request parameters as dict.
+        """
+        raise NotImplementedError()
--- a/manifest/clients/dummy.py
+++ b/manifest/clients/dummy.py
@ -0,0 +1,52 @@
+"""Dummy client."""
+import logging
+from typing import Any, Callable, Dict, Optional, Tuple
+
+from manifest.clients import Client
+from manifest.clients.response import Response
+
+logger = logging.getLogger(__name__)
+
+
+class DummyClient(Client):
+    """Dummy client."""
+
+    def connect(
+        self,
+        connection_str: Optional[str] = None,
+        num_results: Optional[int] = 1,
+        **kwargs: Any,
+    ) -> None:
+        """
+        Connect to dummpy server.
+
+        This is a dummy client that returns identity responses. Used for testing.
+        """
+        self.num_results = num_results
+
+    def close(self) -> None:
+        """Close the client."""
+        pass
+
+    def get_request(
+        self, query: str, **kwargs: Any
+    ) -> Tuple[Callable[[], Response], Dict]:
+        """
+        Get request string function.
+
+        Args:
+            query: query string.
+
+        Returns:
+            request function that takes no input.
+            request parameters as dict.
+        """
+        request_params = {
+            "prompt": query,
+            "num_results": kwargs.get("num_results", self.num_results),
+        }
+
+        def _run_completion() -> Response:
+            return Response({"choices": [{"text": "hello"}] * self.num_results})
+
+        return _run_completion, request_params
--- a/manifest/clients/openai.py
+++ b/manifest/clients/openai.py
@ -0,0 +1,95 @@
+"""OpenAI client."""
+import logging
+import os
+from typing import Any, Callable, Dict, Optional, Tuple
+
+import openai
+
+from manifest.clients import Response
+from manifest.clients.client import Client
+
+logging.getLogger("openai").setLevel(logging.WARNING)
+logger = logging.getLogger(__name__)
+
+OPENAI_ENGINES = {
+    "text-davinci-002",
+    "text-curie-001",
+    "text-babbage-001",
+    "text-ada-001",
+}
+
+
+class OpenAIClient(Client):
+    """OpenAI client."""
+
+    def connect(
+        self,
+        connection_str: Optional[str] = None,
+        engine: Optional[str] = "text-ada-001",
+        temperature: Optional[float] = 0.0,
+        max_tokens: Optional[int] = 10,
+        top_p: Optional[int] = 1,
+        frequency_penalty: Optional[int] = 0,
+        presence_penalty: Optional[int] = 0,
+        n: Optional[int] = 1,
+        **kwargs: Any,
+    ) -> None:
+        """
+        Connect to the OpenAI server.
+
+        connection_str is passed as default OPENAI_API_KEY if variable not set.
+        """
+        openai.api_key = os.environ.get("OPENAI_API_KEY", connection_str)
+        if openai.api_key is None:
+            raise ValueError(
+                "OpenAI API key not set. Set OPENAI_API_KEY environment ",
+                "svariable or pass through `connection_str`.",
+            )
+        self.engine = engine
+        if self.engine not in OPENAI_ENGINES:
+            raise ValueError(f"Invalid engine {self.engine}. Must be {OPENAI_ENGINES}.")
+        self.temperature = temperature
+        self.max_tokens = max_tokens
+        self.top_p = top_p
+        self.frequency_penalty = frequency_penalty
+        self.presence_penalty = presence_penalty
+        self.n = n
+
+    def close(self) -> None:
+        """Close the client."""
+        pass
+
+    def get_request(
+        self, query: str, **kwargs: Any
+    ) -> Tuple[Callable[[], Response], Dict]:
+        """
+        Get request string function.
+
+        Args:
+            query: query string.
+
+        Returns:
+            request function that takes no input.
+            request parameters as dict.
+        """
+        request_params = {
+            "engine": kwargs.get("engine", self.engine),
+            "prompt": query,
+            "temperature": kwargs.get("temperature", self.temperature),
+            "max_tokens": kwargs.get("max_tokens", self.max_tokens),
+            "top_p": kwargs.get("top_p", self.top_p),
+            "frequency_penalty": kwargs.get(
+                "frequency_penalty", self.frequency_penalty
+            ),
+            "presence_penalty": kwargs.get("presence_penalty", self.presence_penalty),
+            "n": kwargs.get("n", self.n),
+        }
+
+        def _run_completion() -> Response:
+            try:
+                return Response(openai.Completion.create(**request_params))
+            except openai.error.OpenAIError as e:
+                logger.error(e)
+                raise e
+
+        return _run_completion, request_params
--- a/manifest/clients/response.py
+++ b/manifest/clients/response.py
@ -0,0 +1,70 @@
+"""Client response."""
+import json
+from typing import Dict, List, Union
+
+
+class Response:
+    """Response class."""
+
+    def __init__(self, response: Union[str, Dict]):
+        """Initialize response."""
+        if isinstance(response, str):
+            self.response = json.loads(response)
+        elif isinstance(response, dict):
+            self.response = response
+        else:
+            raise ValueError("Response must be str or dict")
+        if ("choices" not in self.response) or (
+            not isinstance(self.response["choices"], list)
+        ):
+            raise ValueError(
+                "Response must be serialized to a dict with a list of choices"
+            )
+        if len(self.response["choices"]) > 0:
+            if "text" not in self.response["choices"][0]:
+                raise ValueError(
+                    "Response must be serialized to a dict with a ",
+                    "list of choices with text field",
+                )
+
+    def __getitem__(self, key: str) -> str:
+        """
+        Return the response given the key.
+
+        Args:
+            key: key to get.
+
+        Returns:
+            value of key.
+        """
+        return self.response[key]
+
+    def get_results(self) -> Union[str, List[str]]:
+        """Get all text results from response."""
+        if len(self.response["choices"]) == 0:
+            return None
+        if len(self.response["choices"]) == 1:
+            return self.response["choices"][0]["text"]
+        return [choice["text"] for choice in self.response["choices"]]
+
+    def serialize(self) -> str:
+        """
+        Serialize response to string.
+
+        Returns:
+            serialized response.
+        """
+        return json.dumps(self.response, sort_keys=True)
+
+    @classmethod
+    def deserialize(cls, value: str) -> "Response":
+        """
+        Deserialize string to response.
+
+        Args:
+            value: serialized response.
+
+        Returns:
+            serialized response.
+        """
+        return Response(value)
--- a/manifest/manifest.py
+++ b/manifest/manifest.py
@ -0,0 +1,138 @@
+"""Manifest class."""
+import logging
+from typing import Any, Iterable, List, Optional, Union
+
+logging.getLogger("openai").setLevel(logging.WARNING)
+logger = logging.getLogger(__name__)
+
+from manifest import Prompt
+from manifest.caches.redis import RedisCache
+from manifest.caches.sqlite import SQLiteCache
+from manifest.clients.dummy import DummyClient
+from manifest.clients.openai import OpenAIClient
+
+CLIENT_CONSTRUCTORS = {
+    "openai": OpenAIClient,
+    # "huggingface": manifest.clients.huggingface.HuggingFaceClient,
+    "dummy": DummyClient,
+}
+
+CACHE_CONSTRUCTORS = {
+    "redis": RedisCache,
+    "sqlite": SQLiteCache,
+}
+
+
+class Manifest:
+    """Manifest session object."""
+
+    def __init__(
+        self,
+        client_name: str = "openai",
+        client_connection: Optional[str] = None,
+        cache_name: str = "redis",
+        cache_connection: str = "localhost:6379",
+        **kwargs: Any,
+    ):
+        """
+        Initialize manifest.
+
+        Remaining kwargs sent to client and cache.
+        """
+        if client_name not in CLIENT_CONSTRUCTORS:
+            raise ValueError(
+                f"Unknown client name: {client_name}. "
+                f"Choices are {list(CLIENT_CONSTRUCTORS.keys())}"
+            )
+        if cache_name not in CACHE_CONSTRUCTORS:
+            raise ValueError(
+                f"Unknown cache name: {cache_name}. "
+                f"Choices are {list(CACHE_CONSTRUCTORS.keys())}"
+            )
+        self.client_name = client_name
+        self.client = CLIENT_CONSTRUCTORS[client_name](client_connection, **kwargs)
+        self.cache = CACHE_CONSTRUCTORS[cache_name](cache_connection, **kwargs)
+
+    def close(self) -> None:
+        """Close the client and cache."""
+        self.client.close()
+        self.cache.close()
+
+    def run(
+        self,
+        prompt: Prompt,
+        input: Optional[Any] = None,
+        overwrite_cache: bool = False,
+        **kwargs: Any,
+    ) -> Union[str, List[str]]:
+        """
+        Run the prompt.
+
+        Args:
+            prompt: prompt to run.
+            input: input to prompt.
+            overwrite_cache: whether to overwrite cache.
+
+        Returns:
+            response from prompt.
+        """
+        prompt_str = prompt(input)
+        possible_request, full_kwargs = self.client.get_request(prompt_str, **kwargs)
+        # Create cacke key
+        cache_key = full_kwargs.copy()
+        # Make query model dependent
+        cache_key["client_name"] = self.client_name
+        # Make query prompt dependent
+        cache_key["prompt"] = prompt_str
+        response, _ = self.cache.get(cache_key, overwrite_cache, possible_request)
+        return response.get_results()
+
+    def run_batch(
+        self,
+        prompt: Prompt,
+        input: Optional[Iterable[Any]] = None,
+        overwrite_cache: bool = False,
+        **kwargs: Any,
+    ) -> Iterable[Union[str, List[str]]]:
+        """
+        Run the prompt on a batch of inputs.
+
+        Args:
+            prompt: prompt to run.
+            input: batch of inputs.
+            overwrite_cache: whether to overwrite cache.
+
+        Returns:
+            batch of responses.
+        """
+        if input is None:
+            input = [None]
+        return [self.run(prompt, inp, overwrite_cache, **kwargs) for inp in input]
+
+    def save_prompt(self, name: str, prompt: Prompt) -> None:
+        """
+        Save the prompt to the cache for long term storage.
+
+        Args:
+            name: name of prompt.
+            prompt: prompt to save.
+        """
+        self.cache.set_key(name, prompt.serialize(), table="prompt")
+
+    def load_prompt(self, name: str) -> Prompt:
+        """
+        Load the prompt from the cache.
+
+        Args:
+            name: name of prompt.
+
+        Returns:
+            Prompt saved with name.
+        """
+        return Prompt.deserialize(self.cache.get_key(name, table="prompt"))
+
+    def open_explorer(self) -> None:
+        """Open the explorer for jupyter widget."""
+        # Open explorer
+        # TODO: implement
+        pass
--- a/manifest/prompt.py
+++ b/manifest/prompt.py
@ -0,0 +1,72 @@
+"""Prompt class."""
+
+import inspect
+import logging
+from typing import Any, Callable, List, Optional, Union
+
+logging.getLogger("openai").setLevel(logging.WARNING)
+logger = logging.getLogger(__name__)
+
+
+class Prompt:
+    """Prompt class."""
+
+    def __init__(self, prompt_obj: Union[str, Callable, "Prompt", List["Prompt"]]):
+        """
+        Initialize prompt.
+
+        If prompt_obj is a string, it will be cast as function.
+        If prompt_obj is list of promts, it will be composed.
+        """
+        # TODO: figure out how to compose prompts to keep the
+        # interface simple? Can we make a function
+        # such that a single call will run the composition?
+        if isinstance(prompt_obj, str):
+            self.prompt_func = lambda: prompt_obj
+        elif callable(prompt_obj):
+            self.prompt_func = prompt_obj
+        else:
+            # TODO: implement
+            raise NotImplementedError()
+        self.num_args = len(inspect.signature(self.prompt_func).parameters)
+        if self.num_args > 1:
+            raise ValueError("Prompts must have zero or one input.")
+
+    def __call__(self, input: Optional[Any] = None) -> str:
+        """
+        Return the prompt given the inputs.
+
+        Args:
+            input: input to prompt.
+
+        Returns:
+            prompt string.
+        """
+        if self.num_args >= 1:
+            return self.prompt_func(input)  # type: ignore
+        else:
+            return self.prompt_func()
+
+    def serialize(self) -> str:
+        """
+        Return the prompt as str.
+
+        Returns:
+            json object.
+        """
+        # TODO: implement
+        pass
+
+    @classmethod
+    def deserialize(cls, obj: str) -> "Prompt":
+        """
+        Return the prompt from a json object.
+
+        Args:
+            obj: json object.
+
+        Return:
+            prompt.
+        """
+        # TODO: implement
+        pass
--- a/poetry.lock
+++ b/poetry.lock
--- a/pyproject.toml
+++ b/pyproject.toml
@ -0,0 +1,69 @@
+[tool.poetry]
+authors = ["Laurel Orr <lorr1@cs.stanford.edu>, Avanika Narayan <avanikan@stanford.edu>"]
+classifiers = [
+  "Programming Language :: Python",
+  "Programming Language :: Python :: 3",
+  "Programming Language :: Python :: 3.8",
+  "Programming Language :: Python :: 3.9",
+  "Programming Language :: Python :: 3.10"
+]
+description = "Manifest for Prompt Programming"
+name = "manifest"
+repository = "https://github.com/HazyResearch/manifest"
+version = "0.0.1"
+
+[tool.poetry.urls]
+"Bug Tracker" = "https://github.com/HazyResearch/manifest/issues"
+
+[tool.poetry.dependencies]
+python = "^3.8"
+sqlitedict = "^2.0.0"
+openai = "^0.18.1"
+redis = "^4.3.1"
+
+[tool.poetry.dev-dependencies]
+black = "^22.3.0"
+flake8 = "^4.0.0"
+flake8-docstrings = "^1.6.0"
+isort = "^5.9.3"
+mypy = "^0.950"
+pep8-naming = "^0.12.1"
+pre-commit = "^2.14.0"
+pytest = "^7.0.0"
+pytest-cov = "^3.0.0"
+python-dotenv = "^0.20.0"
+recommonmark = "^0.7.1"
+
+[build-system]
+build-backend = "poetry.core.masonry.api"
+requires = ["poetry-core>=1.0.0"]
+
+# Additional Tool Configurations
+[tool.mypy]
+disallow_untyped_defs = true
+strict_optional = false
+
+[[tool.mypy.overrides]]
+ignore_missing_imports = true
+module = [
+  "numpy",
+  "tqdm",
+  "sqlitedict",
+]
+
+[tool.isort]
+combine_as_imports = true
+force_grid_wrap = 0
+include_trailing_comma = true
+known_first_party = ["manifest"]
+line_length = 88
+multi_line_output = 3
+
+[tool.pytest.ini_options]
+log_format = "[%(levelname)s] %(message)s"
+log_date_format = "%Y-%m-%d %H:%M:%S"
+addopts = "-v -rsXx"
+# The following options are useful for local debugging
+# addopts = "-v -rsXx -s -x --pdb"
+# log_cli_level = "DEBUG"
+# log_cli = true
--- a/tests/clients/test_client.py
+++ b/tests/clients/test_client.py
@ -0,0 +1 @@
+"""Test client."""
--- a/tests/clients/test_response.py
+++ b/tests/clients/test_response.py
@ -0,0 +1,59 @@
+"""Response test."""
+import json
+
+import pytest
+
+from manifest.clients import Response
+
+
+def test_init():
+    """Test response initialization."""
+    with pytest.raises(ValueError) as exc_info:
+        response = Response(4)
+    assert str(exc_info.value) == "Response must be str or dict"
+    with pytest.raises(ValueError) as exc_info:
+        response = Response({"test": "hello"})
+    assert (
+        str(exc_info.value)
+        == "Response must be serialized to a dict with a list of choices"
+    )
+    with pytest.raises(ValueError) as exc_info:
+        response = Response({"choices": [{"blah": "hello"}]})
+    assert str(exc_info.value) == (
+        "Response must be serialized to a dict ",
+        "with a list of choices with text field",
+    )
+
+    response = Response({"choices": [{"text": "hello"}]})
+    assert response.response == {"choices": [{"text": "hello"}]}
+
+    response = Response(json.dumps({"choices": [{"text": "hello"}]}))
+    assert response.response == {"choices": [{"text": "hello"}]}
+
+
+def test_getitem():
+    """Test response getitem."""
+    response = Response({"choices": [{"text": "hello"}]})
+    assert response["choices"] == [{"text": "hello"}]
+
+
+def test_serialize():
+    """Test response serialization."""
+    response = Response({"choices": [{"text": "hello"}]})
+    assert Response.deserialize(response.serialize()).response == {
+        "choices": [{"text": "hello"}]
+    }
+
+
+def test_get_results():
+    """Test response get results."""
+    response = Response({"choices": []})
+    assert response.get_results() is None
+
+    response = Response({"choices": [{"text": "hello"}]})
+    assert response.get_results() == "hello"
+
+    response = Response(
+        {"choices": [{"text": "hello"}, {"text": "my"}, {"text": "name"}]}
+    )
+    assert response.get_results() == ["hello", "my", "name"]
--- a/tests/conftest.py
+++ b/tests/conftest.py
@ -0,0 +1,36 @@
+"""Setup for all tests."""
+import os
+import shutil
+
+import pytest
+
+
+@pytest.fixture
+def sqlite_cache(tmp_path):
+    """Sqlite Cache."""
+    cache = str(tmp_path / "sqlite_cache.sqlite")
+    yield cache
+    shutil.rmtree(cache, ignore_errors=True)
+
+
+@pytest.fixture
+def redis_cache():
+    """Redis cache."""
+    if "CI" not in os.environ:
+        # Give a clear warning on setting REDIS_PORT before running tests.
+        try:
+            port = os.environ["REDIS_PORT"]
+        except KeyError:
+            raise KeyError(
+                "Set REDIS_PORT env var to the instance you want to use "
+                + "for testing. Note that doing so WILL delete the db at "
+                + "localhost:REDIS_PORT, db=0, so BE CAREFUL."
+            )
+        host = os.environ.get("REDIS_HOST", "localhost")
+    else:
+        host = os.environ.get("REDIS_HOST", "localhost")
+        port = os.environ.get("REDIS_PORT", 6379)
+    yield f"{host}:{port}"
+    # Clear out the database
+    # db = redis.Redis(host=host, port=port)
+    # db.flushdb()
--- a/tests/test_cache.py
+++ b/tests/test_cache.py
@ -0,0 +1,69 @@
+"""Cache test."""
+import pytest
+from sqlitedict import SqliteDict
+
+from manifest.caches.redis import RedisCache
+from manifest.caches.sqlite import SQLiteCache
+from manifest.clients import Response
+
+
+@pytest.mark.usefixtures("sqlite_cache")
+@pytest.mark.usefixtures("redis_cache")
+@pytest.mark.parametrize("cache_type", ["sqlite"])
+def test_init(sqlite_cache, redis_cache, cache_type):
+    """Test cache initialization."""
+    if cache_type == "sqlite":
+        cache = SQLiteCache(sqlite_cache)
+        assert isinstance(cache.cache, SqliteDict)
+        assert isinstance(cache.prompt_cache, SqliteDict)
+    else:
+        cache = RedisCache(redis_cache)
+
+
+@pytest.mark.usefixtures("sqlite_cache")
+@pytest.mark.usefixtures("redis_cache")
+@pytest.mark.parametrize("cache_type", ["sqlite"])
+def test_key_get_and_set(sqlite_cache, redis_cache, cache_type):
+    """Test cache key get and set."""
+    if cache_type == "sqlite":
+        cache = SQLiteCache(sqlite_cache)
+    else:
+        cache = RedisCache(redis_cache)
+
+    cache.set_key("test", "valueA")
+    cache.set_key("testA", "valueB")
+
+    assert cache.get_key("test") == "valueA"
+    assert cache.get_key("testA") == "valueB"
+
+    cache.set_key("testA", "valueC")
+    assert cache.get_key("testA") == "valueC"
+
+    cache.get_key("test", table="prompt") is None
+    cache.set_key("test", "valueA", table="prompt")
+    cache.get_key("test", table="prompt") == "valueA"
+
+
+@pytest.mark.usefixtures("sqlite_cache")
+@pytest.mark.usefixtures("redis_cache")
+@pytest.mark.parametrize("cache_type", ["sqlite"])
+def test_get(sqlite_cache, redis_cache, cache_type):
+    """Test cache save prompt."""
+    if cache_type == "sqlite":
+        cache = SQLiteCache(sqlite_cache)
+    else:
+        cache = RedisCache(redis_cache)
+    test_request = {"test": "hello", "testA": "world"}
+    compute = lambda: Response({"choices": [{"text": "hello"}]})
+
+    response, cached = cache.get(test_request, overwrite_cache=False, compute=compute)
+    assert response.get_results() == "hello"
+    assert not cached
+
+    response, cached = cache.get(test_request, overwrite_cache=False, compute=compute)
+    assert response.get_results() == "hello"
+    assert cached
+
+    response, cached = cache.get(test_request, overwrite_cache=True, compute=compute)
+    assert response.get_results() == "hello"
+    assert not cached
--- a/tests/test_manifest.py
+++ b/tests/test_manifest.py
@ -0,0 +1,105 @@
+"""Manifest test."""
+import pytest
+
+from manifest import Manifest, Prompt
+from manifest.caches.cache import request_to_key
+from manifest.caches.sqlite import SQLiteCache
+from manifest.clients.dummy import DummyClient
+
+
+@pytest.mark.usefixtures("sqlite_cache")
+def test_init(sqlite_cache):
+    """Test manifest initialization."""
+    manifest = Manifest(
+        client_name="dummy",
+        cache_name="sqlite",
+        cache_connection=sqlite_cache,
+    )
+    assert manifest.client_name == "dummy"
+    assert isinstance(manifest.client, DummyClient)
+    assert isinstance(manifest.cache, SQLiteCache)
+
+    manifest = Manifest(
+        client_name="dummy",
+        cache_name="sqlite",
+        cache_connection=sqlite_cache,
+        num_results=3,
+    )
+    assert manifest.client_name == "dummy"
+    assert isinstance(manifest.client, DummyClient)
+    assert isinstance(manifest.cache, SQLiteCache)
+    assert manifest.client.num_results == 3
+
+
+@pytest.mark.usefixtures("sqlite_cache")
+@pytest.mark.parametrize("num_results", [1, 2])
+def test_run(sqlite_cache, num_results):
+    """Test manifest run."""
+    manifest = Manifest(
+        client_name="dummy",
+        cache_name="sqlite",
+        cache_connection=sqlite_cache,
+        num_results=num_results,
+    )
+    prompt = Prompt("This is a prompt")
+    res = manifest.run(prompt)
+    assert (
+        manifest.cache.get_key(
+            request_to_key(
+                {
+                    "prompt": "This is a prompt",
+                    "client_name": "dummy",
+                    "num_results": num_results,
+                }
+            )
+        )
+        is not None
+    )
+    if num_results == 1:
+        assert res == "hello"
+    else:
+        assert res == ["hello", "hello"]
+
+    prompt = Prompt(lambda x: f"{x} is a prompt")
+    res = manifest.run(prompt, "Hello")
+    assert (
+        manifest.cache.get_key(
+            request_to_key(
+                {
+                    "prompt": "Hello is a prompt",
+                    "client_name": "dummy",
+                    "num_results": num_results,
+                }
+            )
+        )
+        is not None
+    )
+    if num_results == 1:
+        assert res == "hello"
+    else:
+        assert res == ["hello", "hello"]
+
+
+@pytest.mark.usefixtures("sqlite_cache")
+@pytest.mark.parametrize("num_results", [1, 2])
+def test_batch_run(sqlite_cache, num_results):
+    """Test manifest run."""
+    manifest = Manifest(
+        client_name="dummy",
+        cache_name="sqlite",
+        cache_connection=sqlite_cache,
+        num_results=num_results,
+    )
+    prompt = Prompt("This is a prompt")
+    res = manifest.run_batch(prompt)
+    if num_results == 1:
+        assert res == ["hello"]
+    else:
+        assert res == [["hello", "hello"]]
+
+    prompt = Prompt(lambda x: f"{x} is a prompt")
+    res = manifest.run_batch(prompt, ["Hello", "Hello"])
+    if num_results == 1:
+        assert res == ["hello", "hello"]
+    else:
+        assert res == [["hello", "hello"], ["hello", "hello"]]
--- a/tests/test_prompt.py
+++ b/tests/test_prompt.py
@ -0,0 +1,54 @@
+"""Prompt test."""
+import pytest
+
+from manifest import Prompt
+
+
+def test_init():
+    """Test prompt initialization."""
+    str_prompt = "This is a test prompt"
+    func_prompt = lambda: "This is a test prompt"
+    func_single_prompt = lambda x: f"{x} is a test prompt"
+    func_list_prompt = lambda x: f"{x[0]} is a test {x[1]}"
+    func_double_prompt = lambda x, y: f"{x} is a test {y}"
+    # TODO: add list of prompt tests
+
+    # String prompt
+    prompt = Prompt(str_prompt)
+    assert prompt(None) == str_prompt
+    assert prompt() == str_prompt
+
+    # Function no inputs
+    prompt = Prompt(func_prompt)
+    assert prompt(None) == str_prompt
+    assert prompt() == str_prompt
+
+    # Function single inputs
+    prompt = Prompt(func_single_prompt)
+    assert prompt("This") == str_prompt
+    assert prompt("Hello") == "Hello is a test prompt"
+
+    # Function list inputs
+    prompt = Prompt(func_list_prompt)
+    assert prompt(["This", "prompt"]) == str_prompt
+    assert prompt(["Hello", "prompt"]) == "Hello is a test prompt"
+
+    # Function two inputs
+    with pytest.raises(ValueError) as exc_info:
+        Prompt(func_double_prompt)
+    assert str(exc_info.value) == "Prompts must have zero or one input."
+
+
+@pytest.mark.skip(reason="Not implemented")
+def test_serialize():
+    """Test prompt serialization."""
+    str_prompt = "This is a test prompt"
+    func_single_prompt = lambda x: f"{x} is a test prompt"
+
+    # String prompt
+    prompt = Prompt(str_prompt)
+    assert Prompt.deserialize(prompt.serialize()) == prompt
+
+    # Function single inputs
+    prompt = Prompt(func_single_prompt)
+    assert Prompt.deserialize(prompt.serialize()) == prompt