2023-10-01 05:27:21 +03:00
|
|
|
from __future__ import annotations
|
2024-02-22 02:16:58 +03:00
|
|
|
|
2023-09-18 00:23:54 +03:00
|
|
|
from dataclasses import dataclass
|
2024-02-22 02:16:58 +03:00
|
|
|
|
2024-05-19 06:09:55 +03:00
|
|
|
from .Provider import IterListProvider, ProviderType
|
2024-04-12 19:06:54 +03:00
|
|
|
from .Provider import (
|
2024-04-19 15:10:56 +03:00
|
|
|
Aichatos,
|
|
|
|
Bing,
|
|
|
|
Blackbox,
|
2023-10-01 05:27:21 +03:00
|
|
|
ChatgptAi,
|
2024-04-19 15:10:56 +03:00
|
|
|
ChatgptNext,
|
|
|
|
Cnote,
|
2023-10-26 22:32:49 +03:00
|
|
|
DeepInfra,
|
2024-04-19 15:10:56 +03:00
|
|
|
Feedough,
|
|
|
|
FreeGpt,
|
|
|
|
Gemini,
|
2024-05-19 06:09:55 +03:00
|
|
|
GeminiPro,
|
2024-03-14 01:29:49 +03:00
|
|
|
GigaChat,
|
2024-04-19 15:10:56 +03:00
|
|
|
HuggingChat,
|
|
|
|
HuggingFace,
|
|
|
|
Koala,
|
2023-11-18 06:38:31 +03:00
|
|
|
Liaobots,
|
2024-05-19 06:09:55 +03:00
|
|
|
MetaAI,
|
2024-04-19 15:10:56 +03:00
|
|
|
OpenaiChat,
|
|
|
|
PerplexityLabs,
|
2024-04-22 21:02:17 +03:00
|
|
|
Replicate,
|
2024-04-19 15:10:56 +03:00
|
|
|
Pi,
|
2024-02-09 16:24:15 +03:00
|
|
|
Vercel,
|
2023-10-05 06:13:37 +03:00
|
|
|
You,
|
2024-04-25 02:06:11 +03:00
|
|
|
Reka
|
2023-09-18 00:37:14 +03:00
|
|
|
)
|
2023-09-18 00:23:54 +03:00
|
|
|
|
2023-09-20 07:12:34 +03:00
|
|
|
@dataclass(unsafe_hash=True)
class Model:
    """
    Represents a machine learning model configuration.

    Instances are hashable (``unsafe_hash=True``), so they can be used as
    dictionary keys or set members; the hash and equality cover all three
    fields.

    Attributes:
        name (str): Name of the model as passed to the provider.
        base_provider (str): Label of the organisation or platform the model
            comes from (for example ``'openai'`` or ``'anthropic'``).
        best_provider (ProviderType | None): The preferred provider for the
            model, either a single provider or an ``IterListProvider``
            wrapping several. ``None`` means no provider is configured.
    """
    name: str
    base_provider: str
    # Defaults to None, so the annotation is explicitly optional.
    best_provider: ProviderType | None = None

    @staticmethod
    def __all__() -> list[str]:
        """Return the module-level ``_all_models`` list.

        That list holds the string identifiers registered in
        ``ModelUtils.convert`` (aliases included), not the ``name`` field of
        each ``Model``. The list object itself is returned, not a copy.
        """
        return _all_models
|
2023-09-18 00:23:54 +03:00
|
|
|
|
|
|
|
# Generic entry with an empty name and empty base provider.
# NOTE(review): presumably used when the caller does not name a model —
# confirm against the callers of this module.
default = Model(
    name="",
    base_provider="",
    best_provider=IterListProvider([
        Bing,
        ChatgptAi,
        You,
        OpenaiChat,
    ]),
)
|
|
|
|
|
2023-11-16 18:56:23 +03:00
|
|
|
# Also GPT-3.5, but every provider listed here supports long requests and
# long responses. Shares the model name 'gpt-3.5-turbo' with gpt_35_turbo
# and differs only in its provider list.
gpt_35_long = Model(
    name='gpt-3.5-turbo',
    base_provider='openai',
    best_provider=IterListProvider([
        FreeGpt,
        You,
        ChatgptNext,
        OpenaiChat,
        Koala,
    ]),
)
|
2023-09-18 00:23:54 +03:00
|
|
|
|
|
|
|
# GPT-3.5 / GPT-4
gpt_35_turbo = Model(
    name='gpt-3.5-turbo',
    base_provider='openai',
    best_provider=IterListProvider([
        FreeGpt,
        You,
        ChatgptNext,
        Koala,
        OpenaiChat,
        Aichatos,
        Cnote,
        Feedough,
    ]),
)
|
|
|
|
|
|
|
|
# GPT-4 family. gpt_4's provider object is reused by the dated and 32k
# variants defined further down in this module.
gpt_4 = Model(
    name='gpt-4',
    base_provider='openai',
    best_provider=IterListProvider([
        Bing,
        Liaobots,
    ]),
)

gpt_4o = Model(
    name='gpt-4o',
    base_provider='openai',
    best_provider=IterListProvider([
        You,
        Liaobots,
    ]),
)

# Single provider, passed directly rather than wrapped in IterListProvider.
gpt_4_turbo = Model(
    name='gpt-4-turbo',
    base_provider='openai',
    best_provider=Bing,
)
|
|
|
|
|
2024-03-14 01:29:49 +03:00
|
|
|
# GigaChat, served by its dedicated provider.
gigachat = Model(
    name='GigaChat:latest',
    base_provider='gigachat',
    best_provider=GigaChat,
)
|
|
|
|
|
2024-05-19 06:09:55 +03:00
|
|
|
# Meta: the Meta AI assistant plus the Llama 3 and Code Llama checkpoints.
meta = Model(
    name="meta",
    base_provider="meta",
    best_provider=MetaAI,
)

llama3_8b_instruct = Model(
    name="meta-llama/Meta-Llama-3-8B-Instruct",
    base_provider="meta",
    best_provider=IterListProvider([DeepInfra, PerplexityLabs, Replicate]),
)

llama3_70b_instruct = Model(
    name="meta-llama/Meta-Llama-3-70B-Instruct",
    base_provider="meta",
    best_provider=IterListProvider([DeepInfra, PerplexityLabs, Replicate]),
)

codellama_34b_instruct = Model(
    name="codellama/CodeLlama-34b-Instruct-hf",
    base_provider="meta",
    best_provider=HuggingChat,
)

codellama_70b_instruct = Model(
    name="codellama/CodeLlama-70b-Instruct-hf",
    base_provider="meta",
    best_provider=IterListProvider([DeepInfra, PerplexityLabs]),
)
|
|
|
|
|
2024-01-23 13:35:37 +03:00
|
|
|
# Mistral
# All three entries are labelled with base_provider "huggingface".
mixtral_8x7b = Model(
    name="mistralai/Mixtral-8x7B-Instruct-v0.1",
    base_provider="huggingface",
    best_provider=IterListProvider([DeepInfra, HuggingFace, PerplexityLabs]),
)

mistral_7b = Model(
    name="mistralai/Mistral-7B-Instruct-v0.1",
    base_provider="huggingface",
    best_provider=IterListProvider([HuggingChat, HuggingFace, PerplexityLabs]),
)

mistral_7b_v02 = Model(
    name="mistralai/Mistral-7B-Instruct-v0.2",
    base_provider="huggingface",
    best_provider=IterListProvider([DeepInfra, HuggingFace, PerplexityLabs]),
)
|
2023-12-13 15:15:27 +03:00
|
|
|
|
2023-09-18 00:23:54 +03:00
|
|
|
# Google Gemini (formerly Bard)
gemini = Model(
    name='gemini',
    base_provider='google',
    best_provider=Gemini,
)
|
2023-09-18 00:23:54 +03:00
|
|
|
|
|
|
|
# Anthropic Claude family.
claude_v2 = Model(
    name='claude-v2',
    base_provider='anthropic',
    best_provider=IterListProvider([Vercel]),
)

claude_3_opus = Model(
    name='claude-3-opus',
    base_provider='anthropic',
    best_provider=You,
)

claude_3_sonnet = Model(
    name='claude-3-sonnet',
    base_provider='anthropic',
    best_provider=You,
)

# NOTE(review): no provider is configured for this model (explicit None),
# yet it is still registered under 'claude-3-haiku' in ModelUtils.convert.
# Presumably requests for it cannot be routed — confirm whether a provider
# should be assigned or the entry removed.
claude_3_haiku = Model(
    name='claude-3-haiku',
    base_provider='anthropic',
    best_provider=None,
)
|
|
|
|
|
2023-09-18 00:23:54 +03:00
|
|
|
# Versioned and 16k/32k variants. Each one reuses the provider object of the
# corresponding base entry (the same object, not a copy):
#   * 16k variants      -> gpt_35_long
#   * gpt-3.5 0613      -> gpt_35_turbo
#   * gpt-4 variants    -> gpt_4
gpt_35_turbo_16k = Model(
    name='gpt-3.5-turbo-16k',
    base_provider='openai',
    best_provider=gpt_35_long.best_provider,
)

gpt_35_turbo_16k_0613 = Model(
    name='gpt-3.5-turbo-16k-0613',
    base_provider='openai',
    best_provider=gpt_35_long.best_provider,
)

gpt_35_turbo_0613 = Model(
    name='gpt-3.5-turbo-0613',
    base_provider='openai',
    best_provider=gpt_35_turbo.best_provider,
)

gpt_4_0613 = Model(
    name='gpt-4-0613',
    base_provider='openai',
    best_provider=gpt_4.best_provider,
)

gpt_4_32k = Model(
    name='gpt-4-32k',
    base_provider='openai',
    best_provider=gpt_4.best_provider,
)

gpt_4_32k_0613 = Model(
    name='gpt-4-32k-0613',
    base_provider='openai',
    best_provider=gpt_4.best_provider,
)
|
2023-09-18 00:23:54 +03:00
|
|
|
|
2024-01-13 17:58:12 +03:00
|
|
|
# Gemini Pro: the dedicated GeminiPro provider is listed first, then You.
gemini_pro = Model(
    name='gemini-pro',
    base_provider='google',
    best_provider=IterListProvider([GeminiPro, You]),
)
|
|
|
|
|
2023-12-02 01:11:52 +03:00
|
|
|
# Pi, labelled with base provider 'inflection'.
pi = Model(
    name='pi',
    base_provider='inflection',
    best_provider=Pi,
)
|
2023-09-18 00:23:54 +03:00
|
|
|
|
2024-04-13 04:46:20 +03:00
|
|
|
# DBRX is published by Databricks and Command R+ by Cohere (see the
# organisation prefix in each model name). Both entries were previously
# labelled 'mistral', which matched neither model's origin.
dbrx_instruct = Model(
    name='databricks/dbrx-instruct',
    base_provider='databricks',
    best_provider=IterListProvider([DeepInfra, PerplexityLabs]),
)

command_r_plus = Model(
    name='CohereForAI/c4ai-command-r-plus',
    base_provider='cohere',
    best_provider=IterListProvider([HuggingChat]),
)
|
|
|
|
|
2024-04-19 15:10:56 +03:00
|
|
|
# Blackbox, served by its dedicated provider.
blackbox = Model(
    name='blackbox',
    base_provider='blackbox',
    best_provider=Blackbox,
)
|
|
|
|
|
2024-04-25 02:06:11 +03:00
|
|
|
# Reka Core, served by the Reka provider.
reka_core = Model(
    name='reka-core',
    base_provider='Reka AI',
    best_provider=Reka,
)
|
|
|
|
|
2023-09-18 00:23:54 +03:00
|
|
|
class ModelUtils:
    """
    Utility class for mapping string identifiers to Model instances.

    Several identifiers may point at the same Model (aliases). The insertion
    order of ``convert`` is also the order of the module-level model list
    built from its keys.

    Attributes:
        convert (dict[str, Model]): Dictionary mapping model string identifiers to Model instances.
    """
    convert: dict[str, Model] = {
        # gpt-3.5
        'gpt-3.5-turbo': gpt_35_turbo,
        'gpt-3.5-turbo-0613': gpt_35_turbo_0613,
        'gpt-3.5-turbo-16k': gpt_35_turbo_16k,
        'gpt-3.5-turbo-16k-0613': gpt_35_turbo_16k_0613,
        'gpt-3.5-long': gpt_35_long,

        # gpt-4
        'gpt-4o': gpt_4o,
        'gpt-4': gpt_4,
        'gpt-4-0613': gpt_4_0613,
        'gpt-4-32k': gpt_4_32k,
        'gpt-4-32k-0613': gpt_4_32k_0613,
        'gpt-4-turbo': gpt_4_turbo,

        # meta / llama 3
        "meta-ai": meta,
        'llama3-8b': llama3_8b_instruct,  # alias
        'llama3-70b': llama3_70b_instruct,  # alias
        'llama3-8b-instruct': llama3_8b_instruct,
        'llama3-70b-instruct': llama3_70b_instruct,

        # code llama
        'codellama-34b-instruct': codellama_34b_instruct,
        'codellama-70b-instruct': codellama_70b_instruct,

        # Mistral Opensource
        'mixtral-8x7b': mixtral_8x7b,
        'mistral-7b': mistral_7b,
        'mistral-7b-v02': mistral_7b_v02,

        # google gemini
        'gemini': gemini,
        'gemini-pro': gemini_pro,

        # anthropic
        'claude-v2': claude_v2,
        'claude-3-opus': claude_3_opus,
        'claude-3-sonnet': claude_3_sonnet,
        'claude-3-haiku': claude_3_haiku,

        # reka core
        'reka': reka_core,

        # other
        'blackbox': blackbox,
        'command-r+': command_r_plus,
        'dbrx-instruct': dbrx_instruct,
        'gigachat': gigachat,
        'pi': pi,
    }
|
2023-10-19 17:14:48 +03:00
|
|
|
|
2024-02-04 21:50:32 +03:00
|
|
|
# Every identifier registered in ModelUtils.convert, in insertion order.
# Iterating a dict yields its keys, so no explicit .keys() call is needed.
_all_models = list(ModelUtils.convert)
|