2023-12-11 21:53:30 +00:00
|
|
|
from abc import abstractmethod
|
|
|
|
from typing import Any, Optional, Protocol, Sequence, runtime_checkable
|
|
|
|
|
|
|
|
from langchain_core.callbacks import (
|
|
|
|
AsyncCallbackManagerForToolRun,
|
|
|
|
CallbackManagerForToolRun,
|
|
|
|
)
|
|
|
|
from langchain_core.pydantic_v1 import Field
|
|
|
|
from langchain_core.tools import BaseTool
|
|
|
|
|
|
|
|
from langchain_community.llms.gradient_ai import TrainResult
|
|
|
|
|
|
|
|
|
|
|
|
@runtime_checkable
|
|
|
|
class TrainableLLM(Protocol):
|
2023-12-19 13:58:24 +00:00
|
|
|
"""Protocol for trainable language models."""
|
|
|
|
|
2023-12-11 21:53:30 +00:00
|
|
|
@abstractmethod
|
|
|
|
def train_unsupervised(
|
|
|
|
self,
|
|
|
|
inputs: Sequence[str],
|
|
|
|
**kwargs: Any,
|
|
|
|
) -> TrainResult:
|
|
|
|
...
|
|
|
|
|
|
|
|
@abstractmethod
|
|
|
|
async def atrain_unsupervised(
|
|
|
|
self,
|
|
|
|
inputs: Sequence[str],
|
|
|
|
**kwargs: Any,
|
|
|
|
) -> TrainResult:
|
|
|
|
...
|
|
|
|
|
|
|
|
|
|
|
|
class Memorize(BaseTool):
|
2023-12-19 13:58:24 +00:00
|
|
|
"""Tool that trains a language model."""
|
|
|
|
|
2024-01-25 23:24:19 +00:00
|
|
|
name: str = "memorize"
|
2023-12-11 21:53:30 +00:00
|
|
|
description: str = (
|
|
|
|
"Useful whenever you observed novel information "
|
|
|
|
"from previous conversation history, "
|
|
|
|
"i.e., another tool's action outputs or human comments. "
|
|
|
|
"The action input should include observed information in detail, "
|
|
|
|
"then the tool will fine-tune yourself to remember it."
|
|
|
|
)
|
|
|
|
llm: TrainableLLM = Field()
|
|
|
|
|
|
|
|
def _run(
|
|
|
|
self,
|
|
|
|
information_to_learn: str,
|
|
|
|
run_manager: Optional[CallbackManagerForToolRun] = None,
|
|
|
|
) -> str:
|
|
|
|
train_result = self.llm.train_unsupervised((information_to_learn,))
|
|
|
|
return f"Train complete. Loss: {train_result['loss']}"
|
|
|
|
|
|
|
|
async def _arun(
|
|
|
|
self,
|
|
|
|
information_to_learn: str,
|
|
|
|
run_manager: Optional[AsyncCallbackManagerForToolRun] = None,
|
|
|
|
) -> str:
|
|
|
|
train_result = await self.llm.atrain_unsupervised((information_to_learn,))
|
|
|
|
return f"Train complete. Loss: {train_result['loss']}"
|