2023-10-26 01:47:42 +00:00
|
|
|
import re
|
|
|
|
|
2023-10-27 02:44:30 +00:00
|
|
|
from langchain.schema.agent import AgentAction, AgentFinish
|
|
|
|
|
2023-10-26 01:47:42 +00:00
|
|
|
from .agent_scratchpad import _format_docs
|
|
|
|
|
|
|
|
|
|
|
|
def extract_between_tags(tag: str, string: str, strip: bool = True) -> str:
|
|
|
|
ext_list = re.findall(f"<{tag}\s?>(.+?)</{tag}\s?>", string, re.DOTALL)
|
|
|
|
if strip:
|
|
|
|
ext_list = [e.strip() for e in ext_list]
|
|
|
|
if ext_list:
|
|
|
|
if len(ext_list) != 1:
|
|
|
|
raise ValueError
|
|
|
|
# Only return the first one
|
|
|
|
return ext_list[0]
|
|
|
|
|
2023-10-27 02:44:30 +00:00
|
|
|
|
2023-10-26 01:47:42 +00:00
|
|
|
def parse_output(outputs):
|
|
|
|
partial_completion = outputs["partial_completion"]
|
|
|
|
steps = outputs["intermediate_steps"]
|
2023-10-27 02:44:30 +00:00
|
|
|
search_query = extract_between_tags(
|
|
|
|
"search_query", partial_completion + "</search_query>"
|
|
|
|
)
|
2023-10-26 01:47:42 +00:00
|
|
|
if search_query is None:
|
|
|
|
docs = []
|
|
|
|
str_output = ""
|
|
|
|
for action, observation in steps:
|
|
|
|
docs.extend(observation)
|
|
|
|
str_output += action.log
|
2023-10-27 02:44:30 +00:00
|
|
|
str_output += "</search_query>" + _format_docs(observation)
|
2023-10-26 01:47:42 +00:00
|
|
|
str_output += partial_completion
|
|
|
|
return AgentFinish({"docs": docs, "output": str_output}, log=partial_completion)
|
|
|
|
else:
|
2023-10-27 02:44:30 +00:00
|
|
|
return AgentAction(
|
|
|
|
tool="search", tool_input=search_query, log=partial_completion
|
|
|
|
)
|