2023-09-21 18:10:59 +00:00
|
|
|
from __future__ import annotations
|
|
|
|
|
2023-10-17 07:29:12 +00:00
|
|
|
import asyncio
|
2023-09-21 18:10:59 +00:00
|
|
|
import random
|
2024-02-21 23:16:58 +00:00
|
|
|
|
2024-02-27 10:55:40 +00:00
|
|
|
from ..typing import Type, List, CreateResult, Messages, Iterator
|
|
|
|
from .types import BaseProvider, BaseRetryProvider
|
2023-10-22 21:53:18 +00:00
|
|
|
from .. import debug
|
2023-12-10 23:56:06 +00:00
|
|
|
from ..errors import RetryProviderError, RetryNoProviderError
|
2023-09-21 18:10:59 +00:00
|
|
|
|
2024-01-01 16:48:57 +00:00
|
|
|
class RetryProvider(BaseRetryProvider):
    """
    Provider wrapper that tries several providers in turn, or retries a single one.
    """

    def __init__(
        self,
        providers: List[Type[BaseProvider]],
        shuffle: bool = True,
        single_provider_retry: bool = False,
        max_retries: int = 3,
    ) -> None:
        """
        Initialize the RetryProvider.

        Args:
            providers (List[Type[BaseProvider]]): List of providers to use.
            shuffle (bool): Whether to try the providers in random order on each call.
            single_provider_retry (bool): Whether to retry a single provider if it fails.
                Only takes effect when exactly one provider is eligible for the call.
            max_retries (int): Maximum number of attempts for a single provider.
        """
        self.providers = providers
        self.shuffle = shuffle
        self.single_provider_retry = single_provider_retry
        self.max_retries = max_retries
        self.working = True
        self.last_provider: Type[BaseProvider] = None

    def create_completion(
        self,
        model: str,
        messages: Messages,
        stream: bool = False,
        **kwargs,
    ) -> CreateResult:
        """
        Create a completion using available providers, with an option to stream the response.

        Args:
            model (str): The model to be used for completion.
            messages (Messages): The messages to be used for generating completion.
            stream (bool, optional): Flag to indicate if the response should be streamed.
                When set, only providers with a truthy ``supports_stream`` are tried.
                Defaults to False.
            **kwargs: Forwarded unchanged to the provider's ``create_completion``.

        Yields:
            CreateResult: Tokens or results from the completion.

        Raises:
            Exception: The provider's own exception, re-raised as-is, when it fails
                after at least one token has already been yielded.
            Otherwise whatever ``raise_exceptions`` raises once every attempt has
            failed or produced no token.
        """
        if stream:
            providers = [p for p in self.providers if p.supports_stream]
        else:
            # Work on a copy: shuffling must not reorder self.providers (or the
            # list the caller handed to the constructor) as a side effect.
            providers = list(self.providers)
        if self.shuffle:
            random.shuffle(providers)

        exceptions = {}
        started: bool = False

        if self.single_provider_retry and len(providers) == 1:
            provider = providers[0]
            self.last_provider = provider
            for attempt in range(self.max_retries):
                try:
                    if debug.logging:
                        print(f"Using {provider.__name__} provider (attempt {attempt + 1})")
                    for token in provider.create_completion(model, messages, stream, **kwargs):
                        yield token
                        started = True
                    # An attempt that produced no token counts as a failure
                    # and falls through to the next attempt.
                    if started:
                        return
                except Exception as e:
                    exceptions[provider.__name__] = e
                    if debug.logging:
                        print(f"{provider.__name__}: {e.__class__.__name__}: {e}")
                    # Output was already delivered to the consumer, so a retry
                    # would duplicate it; propagate the error instead.
                    if started:
                        raise
        else:
            for provider in providers:
                self.last_provider = provider
                try:
                    if debug.logging:
                        print(f"Using {provider.__name__} provider")
                    for token in provider.create_completion(model, messages, stream, **kwargs):
                        yield token
                        started = True
                    # A provider that produced no token counts as a failure
                    # and the next provider is tried.
                    if started:
                        return
                except Exception as e:
                    exceptions[provider.__name__] = e
                    if debug.logging:
                        print(f"{provider.__name__}: {e.__class__.__name__}: {e}")
                    # Output was already delivered to the consumer, so falling
                    # back would duplicate it; propagate the error instead.
                    if started:
                        raise

        raise_exceptions(exceptions)

    async def create_async(
        self,
        model: str,
        messages: Messages,
        **kwargs,
    ) -> str:
        """
        Asynchronously create a completion using available providers.

        Args:
            model (str): The model to be used for completion.
            messages (Messages): The messages to be used for generating completion.
            **kwargs: Forwarded unchanged to the provider's ``create_async``.
                ``timeout`` (default 60) is additionally used as the limit passed
                to ``asyncio.wait_for`` for each attempt.

        Returns:
            str: The result of the first attempt that completes without raising.

        Raises:
            Whatever ``raise_exceptions`` raises once every attempt has failed.
        """
        # Work on a copy: shuffling must not reorder self.providers (or the
        # list the caller handed to the constructor) as a side effect.
        providers = list(self.providers)
        if self.shuffle:
            random.shuffle(providers)

        exceptions = {}

        if self.single_provider_retry and len(providers) == 1:
            provider = providers[0]
            self.last_provider = provider
            for attempt in range(self.max_retries):
                try:
                    if debug.logging:
                        print(f"Using {provider.__name__} provider (attempt {attempt + 1})")
                    return await asyncio.wait_for(
                        provider.create_async(model, messages, **kwargs),
                        timeout=kwargs.get("timeout", 60),
                    )
                except Exception as e:
                    # Keyed by provider name, so only the latest failure of
                    # the retried provider is kept.
                    exceptions[provider.__name__] = e
                    if debug.logging:
                        print(f"{provider.__name__}: {e.__class__.__name__}: {e}")
        else:
            for provider in providers:
                self.last_provider = provider
                try:
                    if debug.logging:
                        print(f"Using {provider.__name__} provider")
                    return await asyncio.wait_for(
                        provider.create_async(model, messages, **kwargs),
                        timeout=kwargs.get("timeout", 60),
                    )
                except Exception as e:
                    exceptions[provider.__name__] = e
                    if debug.logging:
                        print(f"{provider.__name__}: {e.__class__.__name__}: {e}")

        raise_exceptions(exceptions)
|
2024-01-14 06:45:41 +00:00
|
|
|
|
2024-02-27 10:55:40 +00:00
|
|
|
class IterProvider(BaseRetryProvider):
    """
    Provider wrapper that walks through its providers one by one and moves the
    ones it has tried to the back of the queue for the next call.
    """

    __name__ = "IterProvider"

    def __init__(
        self,
        providers: List[BaseProvider],
    ) -> None:
        """
        Initialize the IterProvider.

        Args:
            providers (List[BaseProvider]): Providers in the order they should be tried.
        """
        # Stored reversed because iter_providers() takes providers with pop(),
        # i.e. from the end. A reversed copy is used so the caller's list is
        # not reordered as a side effect.
        self.providers: List[BaseProvider] = list(reversed(providers))
        self.working: bool = True
        self.last_provider: BaseProvider = None

    def create_completion(
        self,
        model: str,
        messages: Messages,
        stream: bool = False,
        **kwargs
    ) -> CreateResult:
        """
        Create a completion with the first provider that yields at least one token.

        Args:
            model (str): The model to be used for completion.
            messages (Messages): The messages to be used for generating completion.
            stream (bool, optional): Flag to indicate if the response should be streamed.
                When set, providers with a falsy ``supports_stream`` are skipped.
                Defaults to False.
            **kwargs: Forwarded unchanged to the provider's ``create_completion``.

        Yields:
            CreateResult: Tokens or results from the completion.

        Raises:
            Exception: The provider's own exception, re-raised as-is, when it fails
                after at least one token has already been yielded.
            Otherwise whatever ``raise_exceptions`` raises once every provider has
            failed, been skipped, or produced no token.
        """
        exceptions: dict = {}
        started: bool = False
        for provider in self.iter_providers():
            if stream and not provider.supports_stream:
                continue
            try:
                for token in provider.create_completion(model, messages, stream, **kwargs):
                    yield token
                    started = True
                # A provider that produced no token counts as a failure and
                # the next provider is tried.
                if started:
                    return
            except Exception as e:
                exceptions[provider.__name__] = e
                if debug.logging:
                    print(f"{provider.__name__}: {e.__class__.__name__}: {e}")
                # Output was already delivered to the consumer, so falling
                # back would duplicate it; propagate the error instead.
                if started:
                    raise
        raise_exceptions(exceptions)

    async def create_async(
        self,
        model: str,
        messages: Messages,
        **kwargs
    ) -> str:
        """
        Asynchronously create a completion with the first provider that succeeds.

        Args:
            model (str): The model to be used for completion.
            messages (Messages): The messages to be used for generating completion.
            **kwargs: Forwarded unchanged to the provider's ``create_async``.
                ``timeout`` (default 60) is additionally used as the limit passed
                to ``asyncio.wait_for`` for each provider.

        Returns:
            str: The result of the first provider call that completes without raising.

        Raises:
            Whatever ``raise_exceptions`` raises once every provider has failed.
        """
        exceptions: dict = {}
        for provider in self.iter_providers():
            try:
                return await asyncio.wait_for(
                    provider.create_async(model, messages, **kwargs),
                    timeout=kwargs.get("timeout", 60)
                )
            except Exception as e:
                exceptions[provider.__name__] = e
                if debug.logging:
                    print(f"{provider.__name__}: {e.__class__.__name__}: {e}")
        raise_exceptions(exceptions)

    def iter_providers(self) -> Iterator[BaseProvider]:
        """
        Yield providers one at a time, removing each from ``self.providers`` as it is taken.

        When the generator finishes or is closed, the providers taken during this
        run are put back in front of the untaken ones. Because providers are
        taken from the end of the list, the next run starts with the providers
        that were not reached this time.

        Yields:
            BaseProvider: The next provider to try; also stored in ``self.last_provider``.
        """
        used_provider = []
        try:
            while self.providers:
                provider = self.providers.pop()
                used_provider.append(provider)
                self.last_provider = provider
                if debug.logging:
                    print(f"Using {provider.__name__} provider")
                yield provider
        finally:
            # Runs on exhaustion and on early close alike, so no provider is
            # lost when the consumer stops after the first success.
            used_provider.reverse()
            self.providers = [*used_provider, *self.providers]
|
|
|
|
|
|
|
|
def raise_exceptions(exceptions: dict) -> None:
    """
    Raise the error that summarizes a failed run over the providers.

    Args:
        exceptions (dict): Mapping of provider name to the exception recorded for it.

    Raises:
        RetryProviderError: If at least one exception was recorded; the message
            lists every provider name with its exception class and text.
        RetryNoProviderError: If no exception was recorded at all.
    """
    if not exceptions:
        raise RetryNoProviderError("No provider found")

    # One line per provider: "<name>: <ExceptionClass>: <message>".
    details = "\n".join(
        f"{name}: {error.__class__.__name__}: {error}"
        for name, error in exceptions.items()
    )
    raise RetryProviderError("RetryProvider failed:\n" + details)
|