establish router

2 years ago · 6f55fa8ba7
parent 8869b0ab0e
commit 6f55fa8ba7
9 changed files with 228 additions and 186 deletions
--- a/docs/examples/demos/mrkl.ipynb
+++ b/docs/examples/demos/mrkl.ipynb
@ -32,7 +32,7 @@
  },
  {
   "cell_type": "code",
-   "execution_count": 8,
+   "execution_count": 2,
   "id": "07e96d99",
   "metadata": {},
   "outputs": [],
@ -64,7 +64,7 @@
  },
  {
   "cell_type": "code",
-   "execution_count": 9,
+   "execution_count": 3,
   "id": "a069c4b6",
   "metadata": {},
   "outputs": [],
@ -74,7 +74,7 @@
  },
  {
   "cell_type": "code",
-   "execution_count": 6,
+   "execution_count": 4,
   "id": "e603cd7d",
   "metadata": {},
   "outputs": [
@ -86,32 +86,32 @@
      "\n",
      "\u001b[1m> Entering new chain...\u001b[0m\n",
      "What is the age of Olivia Wilde's boyfriend raised to the 0.23 power?\n",
-      "Thought:\u001b[102m I need to find the age of Olivia Wilde's boyfriend\n",
+      "Thought:\u001b[32;1m\u001b[1;3m I need to find the age of Olivia Wilde's boyfriend\n",
      "Action: Search\n",
      "Action Input: \"Olivia Wilde's boyfriend\"\u001b[0m\n",
-      "Observation: \u001b[104mOlivia Wilde started dating Harry Styles after ending her years-long engagement to Jason Sudeikis — see their relationship timeline.\u001b[0m\n",
-      "Thought:\u001b[102m I need to find the age of Harry Styles\n",
+      "Observation: \u001b[36;1m\u001b[1;3mOlivia Wilde started dating Harry Styles after ending her years-long engagement to Jason Sudeikis — see their relationship timeline.\u001b[0m\n",
+      "Thought:\u001b[32;1m\u001b[1;3m I need to find the age of Harry Styles\n",
      "Action: Search\n",
      "Action Input: \"Harry Styles age\"\u001b[0m\n",
-      "Observation: \u001b[104m28 years\u001b[0m\n",
-      "Thought:\u001b[102m I need to calculate 28 to the 0.23 power\n",
+      "Observation: \u001b[36;1m\u001b[1;3m28 years\u001b[0m\n",
+      "Thought:\u001b[32;1m\u001b[1;3m I need to calculate 28 to the 0.23 power\n",
      "Action: Calculator\n",
      "Action Input: 28^0.23\u001b[0m\n",
      "\n",
      "\u001b[1m> Entering new chain...\u001b[0m\n",
-      "28^0.23\u001b[102m\n",
+      "28^0.23\u001b[32;1m\u001b[1;3m\n",
      "\n",
      "```python\n",
      "print(28**0.23)\n",
      "```\n",
      "\u001b[0m\n",
-      "Answer: \u001b[103m2.1520202182226886\n",
+      "Answer: \u001b[33;1m\u001b[1;3m2.1520202182226886\n",
      "\u001b[0m\n",
      "\u001b[1m> Finished chain.\u001b[0m\n",
      "\n",
-      "Observation: \u001b[103mAnswer: 2.1520202182226886\n",
+      "Observation: \u001b[33;1m\u001b[1;3mAnswer: 2.1520202182226886\n",
      "\u001b[0m\n",
-      "Thought:\u001b[102m I now know the final answer\n",
+      "Thought:\u001b[32;1m\u001b[1;3m I now know the final answer\n",
      "Final Answer: 2.1520202182226886\u001b[0m\n",
      "\u001b[1m> Finished chain.\u001b[0m\n"
     ]
@ -122,7 +122,7 @@
       "'2.1520202182226886'"
      ]
     },
-     "execution_count": 6,
+     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
@ -133,7 +133,7 @@
  },
  {
   "cell_type": "code",
-   "execution_count": 10,
+   "execution_count": 5,
   "id": "a5c07010",
   "metadata": {},
   "outputs": [
@ -145,35 +145,35 @@
      "\n",
      "\u001b[1m> Entering new chain...\u001b[0m\n",
      "Who recently released an album called 'The Storm Before the Calm' and are they in the FooBar database? If so, what albums of theirs are in the FooBar database?\n",
-      "Thought:\u001b[102m I need to find an album called 'The Storm Before the Calm'\n",
+      "Thought:\u001b[32;1m\u001b[1;3m I need to find an album called 'The Storm Before the Calm'\n",
      "Action: Search\n",
      "Action Input: \"The Storm Before the Calm album\"\u001b[0m\n",
-      "Observation: \u001b[104mThe Storm Before the Calm (stylized in all lowercase) is the tenth (and eighth international) studio album by Canadian-American singer-songwriter Alanis ...\u001b[0m\n",
-      "Thought:\u001b[102m I need to check if Alanis is in the FooBar database\n",
+      "Observation: \u001b[36;1m\u001b[1;3mThe Storm Before the Calm (stylized in all lowercase) is the tenth (and eighth international) studio album by Canadian-American singer-songwriter Alanis ...\u001b[0m\n",
+      "Thought:\u001b[32;1m\u001b[1;3m I need to check if Alanis is in the FooBar database\n",
      "Action: FooBar DB\n",
      "Action Input: \"Does Alanis Morissette exist in the FooBar database?\"\u001b[0m\n",
      "\n",
      "\u001b[1m> Entering new chain...\u001b[0m\n",
      "Does Alanis Morissette exist in the FooBar database?\n",
-      "SQLQuery:\u001b[102m SELECT * FROM Artist WHERE Name = 'Alanis Morissette'\u001b[0m\n",
-      "SQLResult: \u001b[103m[(4, 'Alanis Morissette')]\u001b[0m\n",
-      "Answer:\u001b[102m Yes\u001b[0m\n",
+      "SQLQuery:\u001b[32;1m\u001b[1;3m SELECT * FROM Artist WHERE Name = 'Alanis Morissette'\u001b[0m\n",
+      "SQLResult: \u001b[33;1m\u001b[1;3m[(4, 'Alanis Morissette')]\u001b[0m\n",
+      "Answer:\u001b[32;1m\u001b[1;3m Yes\u001b[0m\n",
      "\u001b[1m> Finished chain.\u001b[0m\n",
      "\n",
-      "Observation: \u001b[101m Yes\u001b[0m\n",
-      "Thought:\u001b[102m I need to find out what albums of Alanis's are in the FooBar database\n",
+      "Observation: \u001b[38;5;200m\u001b[1;3m Yes\u001b[0m\n",
+      "Thought:\u001b[32;1m\u001b[1;3m I need to find out what albums of Alanis's are in the FooBar database\n",
      "Action: FooBar DB\n",
      "Action Input: \"What albums by Alanis Morissette are in the FooBar database?\"\u001b[0m\n",
      "\n",
      "\u001b[1m> Entering new chain...\u001b[0m\n",
      "What albums by Alanis Morissette are in the FooBar database?\n",
-      "SQLQuery:\u001b[102m SELECT Title FROM Album WHERE ArtistId = (SELECT ArtistId FROM Artist WHERE Name = 'Alanis Morissette')\u001b[0m\n",
-      "SQLResult: \u001b[103m[('Jagged Little Pill',)]\u001b[0m\n",
-      "Answer:\u001b[102m Jagged Little Pill\u001b[0m\n",
+      "SQLQuery:\u001b[32;1m\u001b[1;3m SELECT Album.Title FROM Album JOIN Artist ON Album.ArtistId = Artist.ArtistId WHERE Artist.Name = 'Alanis Morissette'\u001b[0m\n",
+      "SQLResult: \u001b[33;1m\u001b[1;3m[('Jagged Little Pill',)]\u001b[0m\n",
+      "Answer:\u001b[32;1m\u001b[1;3m Jagged Little Pill\u001b[0m\n",
      "\u001b[1m> Finished chain.\u001b[0m\n",
      "\n",
-      "Observation: \u001b[101m Jagged Little Pill\u001b[0m\n",
-      "Thought:\u001b[102m I now know the final answer\n",
+      "Observation: \u001b[38;5;200m\u001b[1;3m Jagged Little Pill\u001b[0m\n",
+      "Thought:\u001b[32;1m\u001b[1;3m I now know the final answer\n",
      "Final Answer: The album is by Alanis Morissette and the albums in the FooBar database by her are Jagged Little Pill\u001b[0m\n",
      "\u001b[1m> Finished chain.\u001b[0m\n"
     ]
@ -184,7 +184,7 @@
       "'The album is by Alanis Morissette and the albums in the FooBar database by her are Jagged Little Pill'"
      ]
     },
-     "execution_count": 10,
+     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
--- a/docs/examples/demos/react.ipynb
+++ b/docs/examples/demos/react.ipynb
@ -37,14 +37,14 @@
      "\n",
      "\u001b[1m> Entering new chain...\u001b[0m\n",
      "Author David Chanoff has collaborated with a U.S. Navy admiral who served as the ambassador to the United Kingdom under which President?\n",
-      "Thought 1:\u001b[102m I need to search David Chanoff and find the U.S. Navy admiral he\n",
-      "collaborated with.\n",
+      "Thought 1:\u001b[32;1m\u001b[1;3m I need to search David Chanoff and find the U.S. Navy admiral he collaborated\n",
+      "with.\n",
      "Action 1: Search[David Chanoff]\u001b[0m\n",
-      "Observation 1: \u001b[103mDavid Chanoff is a noted author of non-fiction work. His work has typically involved collaborations with the principal protagonist of the work concerned. His collaborators have included; Augustus A. White, Joycelyn Elders, Đoàn Văn Toại, William J. Crowe, Ariel Sharon, Kenneth Good and Felix Zandman. He has also written about a wide range of subjects including literary history, education and foreign for The Washington Post, The New Republic and The New York Times Magazine. He has published more than twelve books.\u001b[0m\n",
-      "Thought 2:\u001b[102m The U.S. Navy admiral David Chanoff collaborated with is William J. Crowe.\n",
+      "Observation 1: \u001b[33;1m\u001b[1;3mDavid Chanoff is a noted author of non-fiction work. His work has typically involved collaborations with the principal protagonist of the work concerned. His collaborators have included; Augustus A. White, Joycelyn Elders, Đoàn Văn Toại, William J. Crowe, Ariel Sharon, Kenneth Good and Felix Zandman. He has also written about a wide range of subjects including literary history, education and foreign for The Washington Post, The New Republic and The New York Times Magazine. He has published more than twelve books.\u001b[0m\n",
+      "Thought 2:\u001b[32;1m\u001b[1;3m The U.S. Navy admiral David Chanoff collaborated with is William J. Crowe.\n",
      "Action 2: Search[William J. Crowe]\u001b[0m\n",
-      "Observation 2: \u001b[103mWilliam James Crowe Jr. (January 2, 1925 – October 18, 2007) was a United States Navy admiral and diplomat who served as the 11th chairman of the Joint Chiefs of Staff under Presidents Ronald Reagan and George H. W. Bush, and as the ambassador to the United Kingdom and Chair of the Intelligence Oversight Board under President Bill Clinton.\u001b[0m\n",
-      "Thought 3:\u001b[102m William J. Crowe served as the ambassador to the United Kingdom under President Bill Clinton. So the answer is Bill Clinton.\n",
+      "Observation 2: \u001b[33;1m\u001b[1;3mWilliam James Crowe Jr. (January 2, 1925 – October 18, 2007) was a United States Navy admiral and diplomat who served as the 11th chairman of the Joint Chiefs of Staff under Presidents Ronald Reagan and George H. W. Bush, and as the ambassador to the United Kingdom and Chair of the Intelligence Oversight Board under President Bill Clinton.\u001b[0m\n",
+      "Thought 3:\u001b[32;1m\u001b[1;3m William J. Crowe served as the ambassador to the United Kingdom under President Bill Clinton.\n",
      "Action 3: Finish[Bill Clinton]\u001b[0m\n",
      "\u001b[1m> Finished chain.\u001b[0m\n"
     ]
@ -68,7 +68,7 @@
  {
   "cell_type": "code",
   "execution_count": null,
-   "id": "0a6bd3b4",
+   "id": "b5a265c6",
   "metadata": {},
   "outputs": [],
   "source": []
--- a/docs/examples/demos/self_ask_with_search.ipynb
+++ b/docs/examples/demos/self_ask_with_search.ipynb
@ -24,19 +24,19 @@
      "\n",
      "\u001b[1m> Entering new chain...\u001b[0m\n",
      "What is the hometown of the reigning men's U.S. Open champion?\n",
-      "Are follow up questions needed here:\u001b[102m Yes.\n",
+      "Are follow up questions needed here:\u001b[32;1m\u001b[1;3m Yes.\n",
      "Follow up: Who is the reigning men's U.S. Open champion?\u001b[0m\n",
-      "Intermediate answer: \u001b[103mCarlos Alcaraz won the 2022 Men's single title while Poland's Iga Swiatek won the Women's single title defeating Tunisian's Ons Jabeur..\u001b[0m\u001b[102m\n",
+      "Intermediate answer: \u001b[33;1m\u001b[1;3mCarlos Alcaraz.\u001b[0m\u001b[32;1m\u001b[1;3m\n",
      "Follow up: Where is Carlos Alcaraz from?\u001b[0m\n",
-      "Intermediate answer: \u001b[103mEl Palmar, Murcia, Spain.\u001b[0m\u001b[102m\n",
-      "So the final answer is: El Palmar, Murcia, Spain\u001b[0m\n",
+      "Intermediate answer: \u001b[33;1m\u001b[1;3mEl Palmar, Spain.\u001b[0m\u001b[32;1m\u001b[1;3m\n",
+      "So the final answer is: El Palmar, Spain\u001b[0m\n",
      "\u001b[1m> Finished chain.\u001b[0m\n"
     ]
    },
    {
     "data": {
      "text/plain": [
-       "'\\nSo the final answer is: El Palmar, Murcia, Spain'"
+       "'\\nSo the final answer is: El Palmar, Spain'"
      ]
     },
     "execution_count": 1,
--- a/langchain/chains/mrkl/base.py
+++ b/langchain/chains/mrkl/base.py
@ -1,14 +1,15 @@
 """Attempt to implement MRKL systems as described in arxiv.org/pdf/2205.00445.pdf."""
-from typing import Any, Callable, Dict, List, NamedTuple, Tuple
+from typing import Any, Callable, Dict, List, NamedTuple, Optional, Tuple

 from pydantic import BaseModel, Extra

 from langchain.chains.base import Chain
 from langchain.chains.llm import LLMChain
 from langchain.chains.mrkl.prompt import BASE_TEMPLATE
+from langchain.chains.router import LLMRouterChain
 from langchain.input import ChainedInput, get_color_mapping
 from langchain.llms.base import LLM
-from langchain.prompts import BasePrompt, Prompt
+from langchain.prompts import Prompt

 FINAL_ANSWER_ACTION = "Final Answer: "

@ -48,6 +49,25 @@ def get_action_and_input(llm_output: str) -> Tuple[str, str]:
    return action, action_input.strip(" ").strip('"')


+class MRKLRouterChain(LLMRouterChain):
+    """Router for the MRKL chain."""
+
+    def __init__(self, llm: LLM, chain_configs: List[ChainConfig], **kwargs: Any):
+        """Initialize with an LLM and the chain configs it has access to."""
+        tools = "\n".join(
+            [f"{c.action_name}: {c.action_description}" for c in chain_configs]
+        )
+        tool_names = ", ".join([chain.action_name for chain in chain_configs])
+        template = BASE_TEMPLATE.format(tools=tools, tool_names=tool_names)
+        prompt = Prompt(template=template, input_variables=["input"])
+        llm_chain = LLMChain(llm=llm, prompt=prompt)
+        stops = ["\nObservation"]
+        super().__init__(llm_chain=llm_chain, stops=stops, **kwargs)
+
+    def _extract_action_and_input(self, text: str) -> Optional[Tuple[str, str]]:
+        return get_action_and_input(text)
+
+
 class MRKLChain(Chain, BaseModel):
    """Chain that implements the MRKL system.

@ -68,8 +88,8 @@ class MRKLChain(Chain, BaseModel):

    llm: LLM
    """LLM wrapper to use as router."""
-    prompt: BasePrompt
-    """Prompt to use as router."""
+    chain_configs: List[ChainConfig]
+    """Chain configs this chain has access to."""
    action_to_chain_map: Dict[str, Callable]
    """Mapping from action name to chain to execute."""
    input_key: str = "question"  #: :meta private:
@ -114,15 +134,12 @@ class MRKLChain(Chain, BaseModel):
                ]
                mrkl = MRKLChain.from_chains(llm, chains)
        """
-        tools = "\n".join(
-            [f"{chain.action_name}: {chain.action_description}" for chain in chains]
-        )
-        tool_names = ", ".join([chain.action_name for chain in chains])
-        template = BASE_TEMPLATE.format(tools=tools, tool_names=tool_names)
-        prompt = Prompt(template=template, input_variables=["input"])
        action_to_chain_map = {chain.action_name: chain.action for chain in chains}
        return cls(
-            llm=llm, prompt=prompt, action_to_chain_map=action_to_chain_map, **kwargs
+            llm=llm,
+            chain_configs=chains,
+            action_to_chain_map=action_to_chain_map,
+            **kwargs,
        )

    class Config:
@ -148,7 +165,7 @@ class MRKLChain(Chain, BaseModel):
        return [self.output_key]

    def _call(self, inputs: Dict[str, str]) -> Dict[str, str]:
-        llm_chain = LLMChain(llm=self.llm, prompt=self.prompt)
+        router_chain = MRKLRouterChain(self.llm, self.chain_configs)
        chained_input = ChainedInput(
            f"{inputs[self.input_key]}\nThought:", verbose=self.verbose
        )
@ -156,11 +173,10 @@ class MRKLChain(Chain, BaseModel):
            list(self.action_to_chain_map.keys()), excluded_colors=["green"]
        )
        while True:
-            thought = llm_chain.predict(
-                input=chained_input.input, stop=["\nObservation"]
+            action, action_input, thought = router_chain.get_action_and_input(
+                chained_input.input
            )
            chained_input.add(thought, color="green")
-            action, action_input = get_action_and_input(thought)
            if action == FINAL_ANSWER_ACTION:
                return {self.output_key: action_input}
            chain = self.action_to_chain_map[action]
--- a/langchain/chains/react/base.py
+++ b/langchain/chains/react/base.py
@ -1,38 +1,47 @@
 """Chain that implements the ReAct paper from https://arxiv.org/pdf/2210.03629.pdf."""
 import re
-from typing import Any, Dict, List, Tuple
+from typing import Any, Dict, List, Optional, Tuple

 from pydantic import BaseModel, Extra

 from langchain.chains.base import Chain
 from langchain.chains.llm import LLMChain
 from langchain.chains.react.prompt import PROMPT
+from langchain.chains.router import LLMRouterChain
 from langchain.docstore.base import Docstore
 from langchain.docstore.document import Document
 from langchain.input import ChainedInput
 from langchain.llms.base import LLM


-def predict_until_observation(
-    llm_chain: LLMChain, prompt: str, i: int
-) -> Tuple[str, str, str]:
-    """Generate text until an observation is needed."""
-    action_prefix = f"Action {i}: "
-    stop_seq = f"\nObservation {i}:"
-    ret_text = llm_chain.predict(input=prompt, stop=[stop_seq])
-    # Sometimes the LLM forgets to take an action, so we prompt it to.
-    while not ret_text.split("\n")[-1].startswith(action_prefix):
-        ret_text += f"\nAction {i}:"
-        new_text = llm_chain.predict(input=prompt + ret_text, stop=[stop_seq])
-        ret_text += new_text
-    # The action block should be the last line.
-    action_block = ret_text.split("\n")[-1]
-    action_str = action_block[len(action_prefix) :]
-    # Parse out the action and the directive.
-    re_matches = re.search(r"(.*?)\[(.*?)\]", action_str)
-    if re_matches is None:
-        raise ValueError(f"Could not parse action directive: {action_str}")
-    return ret_text, re_matches.group(1), re_matches.group(2)
+class ReActRouterChain(LLMRouterChain, BaseModel):
+    """Router for the ReAct chin."""
+
+    i: int = 1
+
+    def __init__(self, llm: LLM, **kwargs: Any):
+        """Initialize with the language model."""
+        llm_chain = LLMChain(llm=llm, prompt=PROMPT)
+        stops = ["\nObservation 1:"]
+        super().__init__(llm_chain=llm_chain, stops=stops, **kwargs)
+
+    def _fix_text(self, text: str) -> str:
+        return text + f"\nAction {self.i}:"
+
+    def _extract_action_and_input(self, text: str) -> Optional[Tuple[str, str]]:
+        action_prefix = f"Action {self.i}: "
+        if not text.split("\n")[-1].startswith(action_prefix):
+            return None
+        self.i += 1
+        self.stops = [f"\nObservation {self.i}:"]
+        action_block = text.split("\n")[-1]
+
+        action_str = action_block[len(action_prefix) :]
+        # Parse out the action and the directive.
+        re_matches = re.search(r"(.*?)\[(.*?)\]", action_str)
+        if re_matches is None:
+            raise ValueError(f"Could not parse action directive: {action_str}")
+        return re_matches.group(1), re_matches.group(2)


 class ReActChain(Chain, BaseModel):
@ -76,13 +85,12 @@ class ReActChain(Chain, BaseModel):

    def _call(self, inputs: Dict[str, Any]) -> Dict[str, str]:
        question = inputs[self.input_key]
-        llm_chain = LLMChain(llm=self.llm, prompt=PROMPT)
+        router_chain = ReActRouterChain(self.llm)
        chained_input = ChainedInput(f"{question}\nThought 1:", verbose=self.verbose)
-        i = 1
        document = None
        while True:
-            ret_text, action, directive = predict_until_observation(
-                llm_chain, chained_input.input, i
+            action, directive, ret_text = router_chain.get_action_and_input(
+                chained_input.input
            )
            chained_input.add(ret_text, color="green")
            if action == "Search":
@ -101,7 +109,6 @@ class ReActChain(Chain, BaseModel):
                return {self.output_key: directive}
            else:
                raise ValueError(f"Got unknown action directive: {action}")
-            chained_input.add(f"\nObservation {i}: ")
+            chained_input.add(f"\nObservation {router_chain.i - 1}: ")
            chained_input.add(observation, color="yellow")
-            chained_input.add(f"\nThought {i + 1}:")
-            i += 1
+            chained_input.add(f"\nThought {router_chain.i}:")
--- a/langchain/chains/router.py
+++ b/langchain/chains/router.py
@ -0,0 +1,75 @@
+"""Chain that takes in an input and produces an action and action input."""
+from abc import ABC, abstractmethod
+from typing import Dict, List, Optional, Tuple
+
+from pydantic import BaseModel
+
+from langchain.chains.base import Chain
+from langchain.chains.llm import LLMChain
+
+
+class RouterChain(Chain, BaseModel, ABC):
+    """Chain responsible for deciding the action to take."""
+
+    input_key: str = "input_text"  #: :meta private:
+    action_key: str = "action"  #: :meta private:
+    action_input_key: str = "action_input"  #: :meta private:
+    log_key: str = "log"  #: :meta private:
+
+    @property
+    def input_keys(self) -> List[str]:
+        """Will be the input key.
+
+        :meta private:
+        """
+        return [self.input_key]
+
+    @property
+    def output_keys(self) -> List[str]:
+        """Return three keys: the action, the action input, and the log.
+
+        :meta private:
+        """
+        return [self.action_key, self.action_input_key, self.log_key]
+
+    @abstractmethod
+    def get_action_and_input(self, text: str) -> Tuple[str, str, str]:
+        """Return action, action input, and log (in that order)."""
+
+    def _call(self, inputs: Dict[str, str]) -> Dict[str, str]:
+        action, action_input, log = self.get_action_and_input(inputs[self.input_key])
+        return {
+            self.action_key: action,
+            self.action_input_key: action_input,
+            self.log_key: log,
+        }
+
+
+class LLMRouterChain(RouterChain, BaseModel, ABC):
+    """RouterChain that uses an LLM."""
+
+    llm_chain: LLMChain
+    stops: Optional[List[str]]
+
+    @abstractmethod
+    def _extract_action_and_input(self, text: str) -> Optional[Tuple[str, str]]:
+        """Extract action and action input from llm output."""
+
+    def _fix_text(self, text: str) -> str:
+        """Fix the text."""
+        raise ValueError("fix_text not implemented for this router.")
+
+    def get_action_and_input(self, text: str) -> Tuple[str, str, str]:
+        """Return action, action input, and log (in that order)."""
+        input_key = self.llm_chain.input_keys[0]
+        inputs = {input_key: text, "stop": self.stops}
+        full_output = self.llm_chain.predict(**inputs)
+        parsed_output = self._extract_action_and_input(full_output)
+        while parsed_output is None:
+            full_output = self._fix_text(full_output)
+            inputs = {input_key: text + full_output, "stop": self.stops}
+            output = self.llm_chain.predict(**inputs)
+            full_output += output
+            parsed_output = self._extract_action_and_input(full_output)
+        action, action_input = parsed_output
+        return action, action_input, full_output
--- a/langchain/chains/self_ask_with_search/base.py
+++ b/langchain/chains/self_ask_with_search/base.py
@ -1,77 +1,46 @@
 """Chain that does self ask with search."""
-from typing import Any, Dict, List
+from typing import Any, Dict, List, Tuple

 from pydantic import BaseModel, Extra

 from langchain.chains.base import Chain
 from langchain.chains.llm import LLMChain
+from langchain.chains.router import LLMRouterChain
 from langchain.chains.self_ask_with_search.prompt import PROMPT
 from langchain.chains.serpapi import SerpAPIChain
 from langchain.input import ChainedInput
 from langchain.llms.base import LLM


-def extract_answer(generated: str) -> str:
-    """Extract answer from text."""
-    if "\n" not in generated:
-        last_line = generated
-    else:
-        last_line = generated.split("\n")[-1]
+class SelfAskWithSearchRouter(LLMRouterChain):
+    """Router for the self-ask-with-search paper."""

-    if ":" not in last_line:
-        after_colon = last_line
-    else:
-        after_colon = generated.split(":")[-1]
+    def __init__(self, llm: LLM, **kwargs: Any):
+        """Initialize with an LLM."""
+        llm_chain = LLMChain(llm=llm, prompt=PROMPT)
+        super().__init__(llm_chain=llm_chain, **kwargs)

-    if " " == after_colon[0]:
-        after_colon = after_colon[1:]
-    if "." == after_colon[-1]:
-        after_colon = after_colon[:-1]
-
-    return after_colon
-
-
-def extract_question(generated: str, followup: str) -> str:
-    """Extract question from text."""
-    if "\n" not in generated:
-        last_line = generated
-    else:
-        last_line = generated.split("\n")[-1]
-
-    if followup not in last_line:
-        print("we probably should never get here..." + generated)
-
-    if ":" not in last_line:
-        after_colon = last_line
-    else:
-        after_colon = generated.split(":")[-1]
-
-    if " " == after_colon[0]:
-        after_colon = after_colon[1:]
-    if "?" != after_colon[-1]:
-        print("we probably should never get here..." + generated)
-
-    return after_colon
-
-
-def get_last_line(generated: str) -> str:
-    """Get the last line in text."""
-    if "\n" not in generated:
-        last_line = generated
-    else:
-        last_line = generated.split("\n")[-1]
-
-    return last_line
+    def _extract_action_and_input(self, text: str) -> Tuple[str, str]:
+        followup = "Follow up:"
+        if "\n" not in text:
+            last_line = text
+        else:
+            last_line = text.split("\n")[-1]

+        if followup not in last_line:
+            return "Final Answer", text

-def greenify(_input: str) -> str:
-    """Add green highlighting to text."""
-    return "\x1b[102m" + _input + "\x1b[0m"
+        if ":" not in last_line:
+            after_colon = last_line
+        else:
+            after_colon = text.split(":")[-1]

+        if " " == after_colon[0]:
+            after_colon = after_colon[1:]
+        if "?" != after_colon[-1]:
+            print("we probably should never get here..." + text)

-def yellowfy(_input: str) -> str:
-    """Add yellow highlighting to text."""
-    return "\x1b[106m" + _input + "\x1b[0m"
+        return "Intermediate Answer", after_colon


 class SelfAskWithSearchChain(Chain, BaseModel):
@ -117,33 +86,14 @@ class SelfAskWithSearchChain(Chain, BaseModel):
    def _call(self, inputs: Dict[str, Any]) -> Dict[str, str]:
        chained_input = ChainedInput(inputs[self.input_key], verbose=self.verbose)
        chained_input.add("\nAre follow up questions needed here:")
-        llm_chain = LLMChain(llm=self.llm, prompt=PROMPT)
        intermediate = "\nIntermediate answer:"
-        followup = "Follow up:"
-        finalans = "\nSo the final answer is:"
-        ret_text = llm_chain.predict(input=chained_input.input, stop=[intermediate])
-        chained_input.add(ret_text, color="green")
-        while followup in get_last_line(ret_text):
-            question = extract_question(ret_text, followup)
-            external_answer = self.search_chain.run(question)
-            if external_answer is not None:
-                chained_input.add(intermediate + " ")
-                chained_input.add(external_answer + ".", color="yellow")
-                ret_text = llm_chain.predict(
-                    input=chained_input.input, stop=["\nIntermediate answer:"]
-                )
-                chained_input.add(ret_text, color="green")
-            else:
-                # We only get here in the very rare case that Google returns no answer.
-                chained_input.add(intermediate + " ")
-                preds = llm_chain.predict(
-                    input=chained_input.input, stop=["\n" + followup, finalans]
-                )
-                chained_input.add(preds, color="green")
-
-        if finalans not in ret_text:
-            chained_input.add(finalans)
-            ret_text = llm_chain.predict(input=chained_input.input, stop=["\n"])
-            chained_input.add(ret_text, color="green")
-
-        return {self.output_key: ret_text}
+        router = SelfAskWithSearchRouter(self.llm, stops=[intermediate])
+        action, action_input, log = router.get_action_and_input(chained_input.input)
+        chained_input.add(log, color="green")
+        while action != "Final Answer":
+            external_answer = self.search_chain.run(action_input)
+            chained_input.add(intermediate + " ")
+            chained_input.add(external_answer + ".", color="yellow")
+            action, action_input, log = router.get_action_and_input(chained_input.input)
+            chained_input.add(log, color="green")
+        return {self.output_key: action_input}
--- a/tests/unit_tests/chains/test_mrkl.py
+++ b/tests/unit_tests/chains/test_mrkl.py
@ -2,7 +2,11 @@

 import pytest

-from langchain.chains.mrkl.base import ChainConfig, MRKLChain, get_action_and_input
+from langchain.chains.mrkl.base import (
+    ChainConfig,
+    MRKLRouterChain,
+    get_action_and_input,
+)
 from langchain.chains.mrkl.prompt import BASE_TEMPLATE
 from langchain.prompts import Prompt
 from tests.unit_tests.llms.fake_llm import FakeLLM
@ -59,12 +63,12 @@ def test_from_chains() -> None:
            action_name="bar", action=lambda x: "bar", action_description="foobar2"
        ),
    ]
-    mrkl_chain = MRKLChain.from_chains(FakeLLM(), chain_configs)
+    router_chain = MRKLRouterChain(FakeLLM(), chain_configs)
    expected_tools_prompt = "foo: foobar1\nbar: foobar2"
    expected_tool_names = "foo, bar"
    expected_template = BASE_TEMPLATE.format(
        tools=expected_tools_prompt, tool_names=expected_tool_names
    )
-    prompt = mrkl_chain.prompt
+    prompt = router_chain.llm_chain.prompt
    assert isinstance(prompt, Prompt)
    assert prompt.template == expected_template
--- a/tests/unit_tests/chains/test_react.py
+++ b/tests/unit_tests/chains/test_react.py
@ -4,8 +4,7 @@ from typing import Any, List, Mapping, Optional, Union

 import pytest

-from langchain.chains.llm import LLMChain
-from langchain.chains.react.base import ReActChain, predict_until_observation
+from langchain.chains.react.base import ReActChain, ReActRouterChain
 from langchain.docstore.base import Docstore
 from langchain.docstore.document import Document
 from langchain.llms.base import LLM
@ -53,8 +52,8 @@ def test_predict_until_observation_normal() -> None:
    """Test predict_until_observation when observation is made normally."""
    outputs = ["foo\nAction 1: search[foo]"]
    fake_llm = FakeListLLM(outputs)
-    fake_llm_chain = LLMChain(llm=fake_llm, prompt=_FAKE_PROMPT)
-    ret_text, action, directive = predict_until_observation(fake_llm_chain, "", 1)
+    router_chain = ReActRouterChain(llm=fake_llm)
+    action, directive, ret_text = router_chain.get_action_and_input("")
    assert ret_text == outputs[0]
    assert action == "search"
    assert directive == "foo"
@ -64,22 +63,13 @@ def test_predict_until_observation_repeat() -> None:
    """Test when no action is generated initially."""
    outputs = ["foo", " search[foo]"]
    fake_llm = FakeListLLM(outputs)
-    fake_llm_chain = LLMChain(llm=fake_llm, prompt=_FAKE_PROMPT)
-    ret_text, action, directive = predict_until_observation(fake_llm_chain, "", 1)
+    router_chain = ReActRouterChain(llm=fake_llm)
+    action, directive, ret_text = router_chain.get_action_and_input("")
    assert ret_text == "foo\nAction 1: search[foo]"
    assert action == "search"
    assert directive == "foo"


-def test_predict_until_observation_error() -> None:
-    """Test handling of generation of text that cannot be parsed."""
-    outputs = ["foo\nAction 1: foo"]
-    fake_llm = FakeListLLM(outputs)
-    fake_llm_chain = LLMChain(llm=fake_llm, prompt=_FAKE_PROMPT)
-    with pytest.raises(ValueError):
-        predict_until_observation(fake_llm_chain, "", 1)
-
-
 def test_react_chain() -> None:
    """Test react chain."""
    responses = [