langchain/templates/extraction-openai-functions/extraction_openai_functions/chain.py

import json
from typing import List, Optional

from langchain.chat_models import ChatOpenAI
from langchain.prompts import ChatPromptTemplate
from langchain.pydantic_v1 import BaseModel
from langchain.utils.openai_functions import convert_pydantic_to_openai_function

# System instructions for the extraction task. This text is sent to the model
# verbatim, so its wording is kept exactly as authored.
template = """A article will be passed to you. Extract from it all papers that are mentioned by this article. 

Do not extract the name of the article itself. If no papers are mentioned that's fine - you don't need to extract any! Just return an empty list.

Do not make up or guess ANY extra information. Only extract what exactly is in the text."""  # noqa: E501

# Two-message chat prompt: the fixed system instructions, followed by a human
# message whose {input} placeholder is filled with the caller's article text.
prompt = ChatPromptTemplate.from_messages(
    [
        ("system", template),
        ("human", "{input}"),
    ]
)


# Function output schema
class Paper(BaseModel):
    """Information about papers mentioned."""

    # One element of Info.papers.
    # NOTE(review): Info is converted into an OpenAI function definition, so the
    # docstring above is presumably forwarded to the model as part of that
    # schema; treat it as runtime text rather than as a plain comment.

    # Title of the mentioned paper; the prompt asks for it exactly as written
    # in the article text.
    title: str
    # Typed Optional so that a paper mentioned without an author can still be
    # represented (the prompt forbids guessing missing information).
    author: Optional[str]


class Info(BaseModel):
    """Information to extract"""

    # Top-level schema passed to convert_pydantic_to_openai_function below. The
    # chain forces the model to call the function named "Info" and then returns
    # only this field's value from the decoded arguments.
    # The prompt asks for an empty list when the article mentions no papers.
    papers: List[Paper]


# Function definition
# Chat model created with its default settings.
model = ChatOpenAI()
# The Info schema, converted to an OpenAI function definition, is the only
# function offered to the model.
function = [convert_pydantic_to_openai_function(Info)]


def _papers_from_function_call(message):
    """Decode the message's function-call arguments and return their "papers" entry."""
    raw_arguments = message.additional_kwargs["function_call"]["arguments"]
    return json.loads(raw_arguments)["papers"]


# Pipeline: fill the prompt, call the model while forcing a call to the "Info"
# function, then pull the list of papers out of the JSON-encoded arguments.
chain = (
    prompt
    | model.bind(functions=function, function_call={"name": "Info"})
    | _papers_from_function_call
)

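# Alternative, kept for reference: the same pipeline using LangChain's built-in
# output parser instead of the hand-written JSON parsing step above. To use it,
# import JsonKeyOutputFunctionsParser from
# langchain.output_parsers.openai_functions.
# chain = prompt | model.bind(
#     functions=function, function_call={"name": "Info"}
# ) | JsonKeyOutputFunctionsParser(key_name="papers")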
Format Templates (#12396) 2023-10-27 02:44:30 +00:00			`import json`
Templates (#12294) Co-authored-by: Harrison Chase <hw.chase.17@gmail.com> Co-authored-by: Lance Martin <lance@langchain.dev> Co-authored-by: Jacob Lee <jacoblee93@gmail.com> 2023-10-26 01:47:42 +00:00			`from typing import List, Optional`
Format Templates (#12396) 2023-10-27 02:44:30 +00:00
Templates (#12294) Co-authored-by: Harrison Chase <hw.chase.17@gmail.com> Co-authored-by: Lance Martin <lance@langchain.dev> Co-authored-by: Jacob Lee <jacoblee93@gmail.com> 2023-10-26 01:47:42 +00:00			`from langchain.chat_models import ChatOpenAI`
			`from langchain.prompts import ChatPromptTemplate`
Format Templates (#12396) 2023-10-27 02:44:30 +00:00			`from langchain.pydantic_v1 import BaseModel`
Templates (#12294) Co-authored-by: Harrison Chase <hw.chase.17@gmail.com> Co-authored-by: Lance Martin <lance@langchain.dev> Co-authored-by: Jacob Lee <jacoblee93@gmail.com> 2023-10-26 01:47:42 +00:00			`from langchain.utils.openai_functions import convert_pydantic_to_openai_function`

			`template = """A article will be passed to you. Extract from it all papers that are mentioned by this article.`

			`Do not extract the name of the article itself. If no papers are mentioned that's fine - you don't need to extract any! Just return an empty list.`

Format Templates (#12396) 2023-10-27 02:44:30 +00:00			`Do not make up or guess ANY extra information. Only extract what exactly is in the text.""" # noqa: E501`

			`prompt = ChatPromptTemplate.from_messages([("system", template), ("human", "{input}")])`
Templates (#12294) Co-authored-by: Harrison Chase <hw.chase.17@gmail.com> Co-authored-by: Lance Martin <lance@langchain.dev> Co-authored-by: Jacob Lee <jacoblee93@gmail.com> 2023-10-26 01:47:42 +00:00

			`# Function output schema`
			`class Paper(BaseModel):`
			`"""Information about papers mentioned."""`
Format Templates (#12396) 2023-10-27 02:44:30 +00:00
Templates (#12294) Co-authored-by: Harrison Chase <hw.chase.17@gmail.com> Co-authored-by: Lance Martin <lance@langchain.dev> Co-authored-by: Jacob Lee <jacoblee93@gmail.com> 2023-10-26 01:47:42 +00:00			`title: str`
			`author: Optional[str]`


			`class Info(BaseModel):`
			`"""Information to extract"""`
Format Templates (#12396) 2023-10-27 02:44:30 +00:00
Templates (#12294) Co-authored-by: Harrison Chase <hw.chase.17@gmail.com> Co-authored-by: Lance Martin <lance@langchain.dev> Co-authored-by: Jacob Lee <jacoblee93@gmail.com> 2023-10-26 01:47:42 +00:00			`papers: List[Paper]`

Format Templates (#12396) 2023-10-27 02:44:30 +00:00
Templates (#12294) Co-authored-by: Harrison Chase <hw.chase.17@gmail.com> Co-authored-by: Lance Martin <lance@langchain.dev> Co-authored-by: Jacob Lee <jacoblee93@gmail.com> 2023-10-26 01:47:42 +00:00			`# Function definition`
			`model = ChatOpenAI()`
			`function = [convert_pydantic_to_openai_function(Info)]`
Format Templates (#12396) 2023-10-27 02:44:30 +00:00			`chain = (`
			`prompt`
			`\| model.bind(functions=function, function_call={"name": "Info"})`
			`\| (`
			`lambda x: json.loads(x.additional_kwargs["function_call"]["arguments"])[`
			`"papers"`
			`]`
			`)`
			`)`
Templates (#12294) Co-authored-by: Harrison Chase <hw.chase.17@gmail.com> Co-authored-by: Lance Martin <lance@langchain.dev> Co-authored-by: Jacob Lee <jacoblee93@gmail.com> 2023-10-26 01:47:42 +00:00
			`# chain = prompt \| model.bind(`
			`# functions=function, function_call={"name": "Info"}`
			`# ) \| JsonKeyOutputFunctionsParser(key_name="papers")`