forked from Archives/langchain
You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
105 lines
3.3 KiB
Python
105 lines
3.3 KiB
Python
"""Question answering over a graph."""
|
|
from __future__ import annotations
|
|
|
|
import re
|
|
from typing import Any, Dict, List, Optional
|
|
|
|
from pydantic import Field
|
|
|
|
from langchain.base_language import BaseLanguageModel
|
|
from langchain.callbacks.manager import CallbackManagerForChainRun
|
|
from langchain.chains.base import Chain
|
|
from langchain.chains.graph_qa.prompts import CYPHER_GENERATION_PROMPT, CYPHER_QA_PROMPT
|
|
from langchain.chains.llm import LLMChain
|
|
from langchain.graphs.neo4j_graph import Neo4jGraph
|
|
from langchain.prompts.base import BasePromptTemplate
|
|
|
|
|
|
def extract_cypher(text: str) -> str:
    """Extract a Cypher statement from text that may wrap it in a code fence.

    If ``text`` contains at least one span delimited by triple backticks, the
    content of the first such span is returned. Otherwise ``text`` is returned
    unchanged.

    A ``cypher`` language tag (any letter case) that stands alone on the
    opening fence line is treated as Markdown fence metadata and dropped, so
    it is not sent to the database as part of the statement. A ``CYPHER``
    keyword followed by more text on the same line (for example query
    options) is left in place because it may belong to the statement itself.

    Args:
        text: Text to search, typically the raw output of a language model.

    Returns:
        The content of the first fenced span, without a stand-alone
        ``cypher`` tag line, or ``text`` itself when no fenced span exists.
    """
    # Optional non-capturing prefix: a lone "cypher" tag, trailing blanks and
    # the line break that ends the opening fence line. The lazy capture group
    # then takes everything up to the next closing fence; DOTALL lets it span
    # several lines.
    fence = re.search(
        r"```(?:cypher[ \t]*\r?\n)?(.*?)```",
        text,
        re.DOTALL | re.IGNORECASE,
    )
    return fence.group(1) if fence else text
|
|
|
|
|
|
class GraphCypherQAChain(Chain):
    """Chain that answers a question about a graph via a generated Cypher statement.

    One LLM chain turns the question and the graph schema into a Cypher
    statement, the statement is run against ``graph``, and a second LLM chain
    turns the query result into the final answer.
    """

    # Graph the generated statement is run against; excluded from serialization.
    graph: Neo4jGraph = Field(exclude=True)
    # Chain that produces the Cypher statement from the question and schema.
    cypher_generation_chain: LLMChain
    # Chain that produces the answer from the question and the query result.
    qa_chain: LLMChain
    input_key: str = "query"  #: :meta private:
    output_key: str = "result"  #: :meta private:

    @property
    def input_keys(self) -> List[str]:
        """List the single key this chain reads from its inputs.

        :meta private:
        """
        return [self.input_key]

    @property
    def output_keys(self) -> List[str]:
        """List the single key this chain writes to its outputs.

        :meta private:
        """
        return [self.output_key]

    @classmethod
    def from_llm(
        cls,
        llm: BaseLanguageModel,
        *,
        qa_prompt: BasePromptTemplate = CYPHER_QA_PROMPT,
        cypher_prompt: BasePromptTemplate = CYPHER_GENERATION_PROMPT,
        **kwargs: Any,
    ) -> GraphCypherQAChain:
        """Build the chain from one language model shared by both sub-chains.

        Args:
            llm: Model used for both Cypher generation and answering.
            qa_prompt: Prompt for the answering chain.
            cypher_prompt: Prompt for the Cypher generation chain.
            **kwargs: Forwarded unchanged to the class constructor.

        Returns:
            A new chain instance wired with the two LLM chains.
        """
        answer_chain = LLMChain(llm=llm, prompt=qa_prompt)
        statement_chain = LLMChain(llm=llm, prompt=cypher_prompt)
        return cls(
            qa_chain=answer_chain,
            cypher_generation_chain=statement_chain,
            **kwargs,
        )

    def _call(
        self,
        inputs: Dict[str, Any],
        run_manager: Optional[CallbackManagerForChainRun] = None,
    ) -> Dict[str, str]:
        """Generate a Cypher statement, run it on the graph and answer the question.

        Args:
            inputs: Chain inputs; the question is read from ``self.input_key``.
            run_manager: Callback manager for this run. A no-op manager is
                used when none is supplied.

        Returns:
            A dict mapping ``self.output_key`` to the answering chain's output.
        """
        manager = run_manager or CallbackManagerForChainRun.get_noop_manager()
        child_callbacks = manager.get_child()
        question = inputs[self.input_key]

        def _report(heading: str, body: str) -> None:
            # Emit a plain heading line followed by the highlighted payload.
            manager.on_text(heading, end="\n", verbose=self.verbose)
            manager.on_text(body, color="green", end="\n", verbose=self.verbose)

        generation_inputs = {"question": question, "schema": self.graph.get_schema}
        raw_statement = self.cypher_generation_chain.run(
            generation_inputs, callbacks=child_callbacks
        )
        # Extract Cypher code if it is wrapped in backticks
        statement = extract_cypher(raw_statement)
        _report("Generated Cypher:", statement)

        context = self.graph.query(statement)
        _report("Full Context:", str(context))

        answer = self.qa_chain(
            {"question": question, "context": context},
            callbacks=child_callbacks,
        )
        return {self.output_key: answer[self.qa_chain.output_key]}
|