gpt4free/g4f/models.py

398 lines
9.2 KiB
Python
Raw Normal View History

2023-10-01 02:27:21 +00:00
from __future__ import annotations
2023-09-17 21:23:54 +00:00
from dataclasses import dataclass
2024-03-13 22:29:49 +00:00
from .Provider import RetryProvider, ProviderType
from .Provider import (
Aichatos,
Bing,
Blackbox,
Chatgpt4Online,
2023-10-01 02:27:21 +00:00
ChatgptAi,
ChatgptNext,
Cohere,
Cnote,
2023-10-26 19:32:49 +00:00
DeepInfra,
Feedough,
FreeGpt,
Gemini,
GeminiProChat,
2024-03-13 22:29:49 +00:00
GigaChat,
HuggingChat,
HuggingFace,
Koala,
Liaobots,
Llama,
OpenaiChat,
PerplexityLabs,
2024-04-22 18:02:17 +00:00
Replicate,
Pi,
Vercel,
You,
2024-04-24 23:06:11 +00:00
Reka
)
2023-09-17 21:23:54 +00:00
@dataclass(unsafe_hash=True)
class Model:
    """
    Represents a machine learning model configuration.

    Attributes:
        name (str): Name of the model.
        base_provider (str): Default provider for the model.
        best_provider (ProviderType | None): The preferred provider for the
            model, typically with retry logic. Defaults to None.
    """
    name: str
    base_provider: str
    # The default is None, so the annotation is optional. The `X | None`
    # spelling relies on the lazy annotations enabled at the top of the file
    # via `from __future__ import annotations`.
    best_provider: ProviderType | None = None

    @staticmethod
    def __all__() -> list[str]:
        """Return the module-level ``_all_models`` list of model identifiers.

        The name is looked up at call time, so it is fine that
        ``_all_models`` is assigned later in the module than this class.
        """
        return _all_models
2023-09-17 21:23:54 +00:00
# Model with an empty name and empty base provider; its best_provider wraps
# the providers listed below in a RetryProvider.
default = Model(
    name="",
    base_provider="",
    best_provider=RetryProvider([
        Bing,
        ChatgptAi,
        You,
        Chatgpt4Online,
        OpenaiChat,
    ]),
)
# GPT-3.5 as well, but every provider listed here supports long requests and
# responses. The model name is the same "gpt-3.5-turbo" string used by
# gpt_35_turbo; only the provider list differs.
gpt_35_long = Model(
    name="gpt-3.5-turbo",
    base_provider="openai",
    best_provider=RetryProvider([
        FreeGpt,
        You,
        ChatgptNext,
        OpenaiChat,
    ]),
)
2023-09-17 21:23:54 +00:00
# GPT-3.5 / GPT-4
gpt_35_turbo = Model(
    name="gpt-3.5-turbo",
    base_provider="openai",
    best_provider=RetryProvider([
        FreeGpt,
        You,
        ChatgptNext,
        Koala,
        OpenaiChat,
        Aichatos,
        Cnote,
        Feedough,
    ]),
)
# GPT-4 family. gpt_4 and gpt_4o wrap their providers in a RetryProvider;
# gpt_4_turbo references the Bing provider directly.
gpt_4 = Model(
    name="gpt-4",
    base_provider="openai",
    best_provider=RetryProvider([
        Bing,
        Liaobots,
    ]),
)

gpt_4o = Model(
    name="gpt-4o",
    base_provider="openai",
    best_provider=RetryProvider([
        You,
    ]),
)

gpt_4_turbo = Model(
    name="gpt-4-turbo",
    base_provider="openai",
    best_provider=Bing,
)
2024-03-13 22:29:49 +00:00
# GigaChat variants; all three use the GigaChat provider directly.
gigachat = Model(
    name="GigaChat:latest",
    base_provider="gigachat",
    best_provider=GigaChat,
)

gigachat_plus = Model(
    name="GigaChat-Plus",
    base_provider="gigachat",
    best_provider=GigaChat,
)

gigachat_pro = Model(
    name="GigaChat-Pro",
    base_provider="gigachat",
    best_provider=GigaChat,
)
2023-10-26 19:32:49 +00:00
# Llama 2 chat models in three sizes. Each one gets its own RetryProvider
# instance over the same pair of providers.
llama2_7b = Model(
    name="meta-llama/Llama-2-7b-chat-hf",
    base_provider="meta",
    best_provider=RetryProvider([Llama, DeepInfra]),
)

llama2_13b = Model(
    name="meta-llama/Llama-2-13b-chat-hf",
    base_provider="meta",
    best_provider=RetryProvider([Llama, DeepInfra]),
)

llama2_70b = Model(
    name="meta-llama/Llama-2-70b-chat-hf",
    base_provider="meta",
    best_provider=RetryProvider([Llama, DeepInfra]),
)
# Llama 3 instruct models. The 8B variant additionally lists Replicate.
llama3_8b_instruct = Model(
    name="meta-llama/Meta-Llama-3-8B-Instruct",
    base_provider="meta",
    best_provider=RetryProvider([Llama, DeepInfra, Replicate]),
)

llama3_70b_instruct = Model(
    name="meta-llama/Meta-Llama-3-70B-Instruct",
    base_provider="meta",
    best_provider=RetryProvider([Llama, DeepInfra]),
)
# Code Llama instruct models. The 34B variant uses HuggingChat directly;
# the 70B variant wraps two providers in a RetryProvider.
codellama_34b_instruct = Model(
    name="codellama/CodeLlama-34b-Instruct-hf",
    base_provider="meta",
    best_provider=HuggingChat,
)

codellama_70b_instruct = Model(
    name="codellama/CodeLlama-70b-Instruct-hf",
    base_provider="meta",
    best_provider=RetryProvider([DeepInfra, PerplexityLabs]),
)
# Mistral
mixtral_8x7b = Model(
    name="mistralai/Mixtral-8x7B-Instruct-v0.1",
    base_provider="huggingface",
    best_provider=RetryProvider([DeepInfra, HuggingFace, PerplexityLabs]),
)

mistral_7b = Model(
    name="mistralai/Mistral-7B-Instruct-v0.1",
    base_provider="huggingface",
    best_provider=RetryProvider([HuggingChat, HuggingFace, PerplexityLabs]),
)

mistral_7b_v02 = Model(
    name="mistralai/Mistral-7B-Instruct-v0.2",
    base_provider="huggingface",
    best_provider=DeepInfra,
)

# NOTE(review): the name below points at a "zephyr-orpo-141b" checkpoint
# rather than a mistralai/* repository -- confirm this is the intended
# target for the mixtral_8x22b entry.
mixtral_8x22b = Model(
    name="HuggingFaceH4/zephyr-orpo-141b-A35b-v0.1",
    base_provider="huggingface",
    best_provider=DeepInfra,
)
2024-04-12 03:18:08 +00:00
# Misc models -- all four use the DeepInfra provider directly.
dolphin_mixtral_8x7b = Model(
    name="cognitivecomputations/dolphin-2.6-mixtral-8x7b",
    base_provider="huggingface",
    best_provider=DeepInfra,
)

lzlv_70b = Model(
    name="lizpreciatior/lzlv_70b_fp16_hf",
    base_provider="huggingface",
    best_provider=DeepInfra,
)

airoboros_70b = Model(
    name="deepinfra/airoboros-70b",
    base_provider="huggingface",
    best_provider=DeepInfra,
)

openchat_35 = Model(
    name="openchat/openchat_3.5",
    base_provider="huggingface",
    best_provider=DeepInfra,
)
2023-12-13 12:15:27 +00:00
2023-09-17 21:23:54 +00:00
# Bard
# `gemini`, `bard` and `palm` are three names bound to the same Model
# instance.
gemini = bard = palm = Model(
    name="gemini",
    base_provider="google",
    best_provider=Gemini,
)
2023-09-17 21:23:54 +00:00
# Anthropic models. claude_v2 wraps a single provider in a RetryProvider;
# the Claude 3 entries reference the You provider directly.
claude_v2 = Model(
    name="claude-v2",
    base_provider="anthropic",
    best_provider=RetryProvider([Vercel]),
)

claude_3_opus = Model(
    name="claude-3-opus",
    base_provider="anthropic",
    best_provider=You,
)

claude_3_sonnet = Model(
    name="claude-3-sonnet",
    base_provider="anthropic",
    best_provider=You,
)
2023-09-17 21:23:54 +00:00
# GPT-3.5 variants. These reuse the provider object of an earlier entry
# instead of building a new one: the 16k models share gpt_35_long's
# provider, the 0613 snapshot shares gpt_35_turbo's.
gpt_35_turbo_16k = Model(
    name="gpt-3.5-turbo-16k",
    base_provider="openai",
    best_provider=gpt_35_long.best_provider,
)

gpt_35_turbo_16k_0613 = Model(
    name="gpt-3.5-turbo-16k-0613",
    base_provider="openai",
    best_provider=gpt_35_long.best_provider,
)

gpt_35_turbo_0613 = Model(
    name="gpt-3.5-turbo-0613",
    base_provider="openai",
    best_provider=gpt_35_turbo.best_provider,
)
2023-09-17 21:23:54 +00:00
# GPT-4 variants; each one shares the provider object already attached to
# gpt_4.
gpt_4_0613 = Model(
    name="gpt-4-0613",
    base_provider="openai",
    best_provider=gpt_4.best_provider,
)

gpt_4_32k = Model(
    name="gpt-4-32k",
    base_provider="openai",
    best_provider=gpt_4.best_provider,
)

gpt_4_32k_0613 = Model(
    name="gpt-4-32k-0613",
    base_provider="openai",
    best_provider=gpt_4.best_provider,
)
2023-09-17 21:23:54 +00:00
# Gemini Pro wraps two providers in a RetryProvider.
gemini_pro = Model(
    name="gemini-pro",
    base_provider="google",
    best_provider=RetryProvider([GeminiProChat, You]),
)

# Pi uses the Pi provider directly.
pi = Model(
    name="pi",
    base_provider="inflection",
    best_provider=Pi,
)
2023-09-17 21:23:54 +00:00
2024-04-13 01:46:20 +00:00
# The model name lives under the "databricks/" namespace, so the base
# provider is recorded as databricks. It was previously labelled "mistral",
# which did not match the model.
dbrx_instruct = Model(
    name="databricks/dbrx-instruct",
    base_provider="databricks",
    best_provider=RetryProvider([DeepInfra, PerplexityLabs]),
)

# The model name lives under the "CohereForAI/" namespace and the Cohere
# provider is one of its backends, so the base provider is recorded as
# cohere. It was previously labelled "mistral".
command_r_plus = Model(
    name="CohereForAI/c4ai-command-r-plus",
    base_provider="cohere",
    best_provider=RetryProvider([HuggingChat, Cohere]),
)
# Blackbox uses the Blackbox provider directly.
blackbox = Model(
    name="blackbox",
    base_provider="blackbox",
    best_provider=Blackbox,
)

# Reka Core uses the Reka provider directly.
reka_core = Model(
    name="reka-core",
    base_provider="Reka AI",
    best_provider=Reka,
)
2023-09-17 21:23:54 +00:00
class ModelUtils:
    """
    Lookup table from string identifiers to the Model instances defined in
    this module.

    Attributes:
        convert (dict[str, Model]): Maps each identifier to its Model.
            Several identifiers may point at the same instance (aliases).
            The module-level ``_all_models`` list is built from these keys,
            so their insertion order is significant.
    """
    convert: dict[str, Model] = {
        # gpt-3.5
        "gpt-3.5-turbo": gpt_35_turbo,
        "gpt-3.5-turbo-0613": gpt_35_turbo_0613,
        "gpt-3.5-turbo-16k": gpt_35_turbo_16k,
        "gpt-3.5-turbo-16k-0613": gpt_35_turbo_16k_0613,
        "gpt-3.5-long": gpt_35_long,

        # gpt-4
        "gpt-4o": gpt_4o,
        "gpt-4": gpt_4,
        "gpt-4-0613": gpt_4_0613,
        "gpt-4-32k": gpt_4_32k,
        "gpt-4-32k-0613": gpt_4_32k_0613,
        "gpt-4-turbo": gpt_4_turbo,

        # Llama
        "llama2-7b": llama2_7b,
        "llama2-13b": llama2_13b,
        "llama2-70b": llama2_70b,

        "llama3-8b": llama3_8b_instruct,  # alias
        "llama3-70b": llama3_70b_instruct,  # alias
        "llama3-8b-instruct": llama3_8b_instruct,
        "llama3-70b-instruct": llama3_70b_instruct,

        "codellama-34b-instruct": codellama_34b_instruct,
        "codellama-70b-instruct": codellama_70b_instruct,

        # GigaChat
        "gigachat": gigachat,
        "gigachat_plus": gigachat_plus,
        "gigachat_pro": gigachat_pro,

        # Mistral Opensource
        "mixtral-8x7b": mixtral_8x7b,
        "mistral-7b": mistral_7b,
        "mistral-7b-v02": mistral_7b_v02,
        "mixtral-8x22b": mixtral_8x22b,
        "dolphin-mixtral-8x7b": dolphin_mixtral_8x7b,

        # google gemini
        "gemini": gemini,
        "gemini-pro": gemini_pro,

        # anthropic
        "claude-v2": claude_v2,
        "claude-3-opus": claude_3_opus,
        "claude-3-sonnet": claude_3_sonnet,

        # reka core
        "reka-core": reka_core,
        "reka": reka_core,
        "Reka Core": reka_core,

        # other
        "blackbox": blackbox,
        "command-r+": command_r_plus,
        "dbrx-instruct": dbrx_instruct,
        "lzlv-70b": lzlv_70b,
        "airoboros-70b": airoboros_70b,
        "openchat_3.5": openchat_35,
        "pi": pi,
    }
2023-10-19 14:14:48 +00:00
2024-02-04 18:50:32 +00:00
# Identifiers registered in ModelUtils.convert, in insertion order
# (iterating a dict yields its keys). Returned by Model.__all__().
_all_models = list(ModelUtils.convert)