langchain/templates/anthropic-iterative-search/anthropic_iterative_search/output_parser.py

38 lines
1.2 KiB
Python
Raw Normal View History

import re
2023-10-27 02:44:30 +00:00
from langchain.schema.agent import AgentAction, AgentFinish
from .agent_scratchpad import _format_docs
def extract_between_tags(tag: str, string: str, strip: bool = True) -> str:
ext_list = re.findall(f"<{tag}\s?>(.+?)</{tag}\s?>", string, re.DOTALL)
if strip:
ext_list = [e.strip() for e in ext_list]
if ext_list:
if len(ext_list) != 1:
raise ValueError
# Only return the first one
return ext_list[0]
2023-10-27 02:44:30 +00:00
def parse_output(outputs):
partial_completion = outputs["partial_completion"]
steps = outputs["intermediate_steps"]
2023-10-27 02:44:30 +00:00
search_query = extract_between_tags(
"search_query", partial_completion + "</search_query>"
)
if search_query is None:
docs = []
str_output = ""
for action, observation in steps:
docs.extend(observation)
str_output += action.log
2023-10-27 02:44:30 +00:00
str_output += "</search_query>" + _format_docs(observation)
str_output += partial_completion
return AgentFinish({"docs": docs, "output": str_output}, log=partial_completion)
else:
2023-10-27 02:44:30 +00:00
return AgentAction(
tool="search", tool_input=search_query, log=partial_completion
)