2023-10-01 05:27:21 +03:00
|
|
|
from __future__ import annotations
|
2024-02-22 02:16:58 +03:00
|
|
|
|
2023-09-18 00:23:54 +03:00
|
|
|
from dataclasses import dataclass
|
2024-02-22 02:16:58 +03:00
|
|
|
|
2024-05-19 06:09:55 +03:00
|
|
|
from .Provider import IterListProvider, ProviderType
|
2024-04-12 19:06:54 +03:00
|
|
|
from .Provider import (
|
2024-09-27 00:24:44 +03:00
|
|
|
AIChatFree,
|
2024-09-13 17:09:31 +03:00
|
|
|
Airforce,
|
2024-07-25 09:21:55 +03:00
|
|
|
Allyfy,
|
2024-07-29 01:37:16 +03:00
|
|
|
Bing,
|
2024-09-06 22:15:35 +03:00
|
|
|
Binjie,
|
2024-09-06 19:32:18 +03:00
|
|
|
Bixin123,
|
2024-07-29 01:37:16 +03:00
|
|
|
Blackbox,
|
2024-09-19 21:58:37 +03:00
|
|
|
ChatGpt,
|
2024-09-02 11:55:51 +03:00
|
|
|
Chatgpt4o,
|
2024-09-24 13:23:53 +03:00
|
|
|
Chatgpt4Online,
|
|
|
|
ChatGptEs,
|
2024-07-29 01:37:16 +03:00
|
|
|
ChatgptFree,
|
|
|
|
DDG,
|
|
|
|
DeepInfra,
|
2024-09-24 13:23:53 +03:00
|
|
|
DeepInfraChat,
|
2024-07-29 01:37:16 +03:00
|
|
|
DeepInfraImage,
|
2024-09-06 23:19:18 +03:00
|
|
|
Free2GPT,
|
2024-07-29 01:37:16 +03:00
|
|
|
FreeChatgpt,
|
|
|
|
FreeGpt,
|
2024-07-30 01:15:36 +03:00
|
|
|
FreeNetfly,
|
2024-07-29 01:37:16 +03:00
|
|
|
Gemini,
|
|
|
|
GeminiPro,
|
|
|
|
GigaChat,
|
|
|
|
HuggingChat,
|
|
|
|
HuggingFace,
|
|
|
|
Koala,
|
|
|
|
Liaobots,
|
2024-09-24 13:23:53 +03:00
|
|
|
LiteIcoding,
|
2024-09-07 01:16:11 +03:00
|
|
|
MagickPen,
|
2024-07-29 01:37:16 +03:00
|
|
|
MetaAI,
|
2024-09-04 02:09:29 +03:00
|
|
|
Nexra,
|
2024-07-29 01:37:16 +03:00
|
|
|
OpenaiChat,
|
|
|
|
PerplexityLabs,
|
|
|
|
Pi,
|
|
|
|
Pizzagpt,
|
|
|
|
Reka,
|
|
|
|
Replicate,
|
|
|
|
ReplicateHome,
|
2024-09-02 11:55:51 +03:00
|
|
|
TeachAnything,
|
2024-08-31 09:47:39 +03:00
|
|
|
Upstage,
|
2024-07-29 01:37:16 +03:00
|
|
|
You,
|
2023-09-18 00:37:14 +03:00
|
|
|
)
|
2023-09-18 00:23:54 +03:00
|
|
|
|
2024-07-29 01:37:16 +03:00
|
|
|
|
2023-09-20 07:12:34 +03:00
|
|
|
@dataclass(unsafe_hash=True)
class Model:
    """
    Represents a machine learning model configuration.

    Instances are created once at module level (one per supported model) and
    registered by string identifier in ``ModelUtils.convert``.

    ``unsafe_hash=True`` makes the dataclass generate ``__hash__`` from the
    fields even though instances stay mutable, so two ``Model`` objects with
    equal fields compare equal and hash alike.

    Attributes:
        name (str): Name of the model (empty string for the ``default`` entry).
        base_provider (str): Label of the vendor/family the model belongs to,
            e.g. ``'OpenAI'`` or ``'Meta Llama'`` as used throughout this module.
        best_provider (ProviderType): The preferred provider for the model,
            typically with retry logic. In this module it is either a single
            provider class or an ``IterListProvider`` wrapping several.
            Defaults to ``None``.
    """
    name: str
    base_provider: str
    best_provider: ProviderType = None

    @staticmethod
    def __all__() -> list[str]:
        """Returns a list of all model names.

        The returned object is the module-level ``_all_models`` list itself
        (built from the keys of ``ModelUtils.convert`` at the end of this
        module), not a copy.
        """
        return _all_models
|
2023-09-18 00:23:54 +03:00
|
|
|
|
|
|
|
# Fallback model used when the caller does not name one: empty name and
# base_provider, with a broad list of providers to choose from.
# NOTE(review): IterListProvider is defined in .Provider (not visible here);
# presumably it tries the listed providers in turn - confirm there.
default = Model(
    name="",
    base_provider="",
    best_provider=IterListProvider([
        DDG,
        FreeChatgpt,
        HuggingChat,
        Pizzagpt,
        ReplicateHome,
        Upstage,
        Blackbox,
        Bixin123,
        Binjie,
        Free2GPT,
        MagickPen,
        DeepInfraChat,
        LiteIcoding,
    ])
)
|
2023-09-18 00:23:54 +03:00
|
|
|
|
2024-07-08 23:41:19 +03:00
|
|
|
############
### Text ###
############

### OpenAI ###
# gpt-3
gpt_3 = Model(
    name='gpt-3',
    base_provider='OpenAI',
    best_provider=IterListProvider([
        Nexra,
    ])
)

# gpt-3.5
gpt_35_turbo = Model(
    name='gpt-3.5-turbo',
    base_provider='OpenAI',
    best_provider=IterListProvider([
        Allyfy, Nexra, Bixin123, Airforce,
    ])
)

# gpt-4
gpt_4o = Model(
    name='gpt-4o',
    base_provider='OpenAI',
    best_provider=IterListProvider([
        Liaobots, Airforce, Chatgpt4o, ChatGptEs,
        OpenaiChat
    ])
)

gpt_4o_mini = Model(
    name='gpt-4o-mini',
    base_provider='OpenAI',
    best_provider=IterListProvider([
        DDG, ChatGptEs, You, FreeNetfly, Pizzagpt, LiteIcoding, MagickPen, Liaobots, Airforce, ChatgptFree, Koala,
        OpenaiChat, ChatGpt
    ])
)

gpt_4_turbo = Model(
    name='gpt-4-turbo',
    base_provider='OpenAI',
    best_provider=IterListProvider([
        Nexra, Bixin123, Liaobots, Airforce, Bing
    ])
)

# gpt_4 nests the provider lists already built for gpt_4_turbo, gpt_4o and
# gpt_4o_mini, so it must stay below those three definitions.
gpt_4 = Model(
    name='gpt-4',
    base_provider='OpenAI',
    best_provider=IterListProvider([
        Nexra, Binjie, Airforce,
        gpt_4_turbo.best_provider, gpt_4o.best_provider, gpt_4o_mini.best_provider,
        Chatgpt4Online, Bing, OpenaiChat,
    ])
)
|
|
|
|
|
2024-07-08 23:41:19 +03:00
|
|
|
|
|
|
|
### GigaChat ###
# Served by a single provider class, so no IterListProvider wrapper is used.
gigachat = Model(
    name='GigaChat:latest',
    base_provider='gigachat',
    best_provider=GigaChat
)
|
|
|
|
|
2024-07-08 23:41:19 +03:00
|
|
|
|
|
|
|
### Meta ###
meta = Model(
    name="meta-ai",
    base_provider="Meta",
    best_provider=MetaAI
)

# llama 2
llama_2_13b = Model(
    name="llama-2-13b",
    base_provider="Meta Llama",
    best_provider=IterListProvider([Airforce])
)

# llama 3
llama_3_8b = Model(
    name="llama-3-8b",
    base_provider="Meta Llama",
    best_provider=IterListProvider([Airforce, DeepInfra, Replicate])
)

llama_3_70b = Model(
    name="llama-3-70b",
    base_provider="Meta Llama",
    best_provider=IterListProvider([ReplicateHome, Airforce, DeepInfra, Replicate])
)

# Family alias: reuses the provider lists of the sized llama-3 variants above.
llama_3 = Model(
    name="llama-3",
    base_provider="Meta Llama",
    best_provider=IterListProvider([llama_3_8b.best_provider, llama_3_70b.best_provider])
)

# llama 3.1
llama_3_1_8b = Model(
    name="llama-3.1-8b",
    base_provider="Meta Llama",
    best_provider=IterListProvider([Blackbox, DeepInfraChat, Airforce, PerplexityLabs])
)

llama_3_1_70b = Model(
    name="llama-3.1-70b",
    base_provider="Meta Llama",
    best_provider=IterListProvider([
        DDG, HuggingChat, Blackbox, FreeGpt, TeachAnything, Free2GPT,
        DeepInfraChat, Airforce, HuggingFace, PerplexityLabs
    ])
)

llama_3_1_405b = Model(
    name="llama-3.1-405b",
    base_provider="Meta Llama",
    best_provider=IterListProvider([Blackbox, DeepInfraChat, Airforce])
)

# Family alias: reuses the provider lists of the sized llama-3.1 variants above.
llama_3_1 = Model(
    name="llama-3.1",
    base_provider="Meta Llama",
    best_provider=IterListProvider([
        llama_3_1_8b.best_provider,
        llama_3_1_70b.best_provider,
        llama_3_1_405b.best_provider,
    ])
)
|
2023-10-26 22:32:49 +03:00
|
|
|
|
2024-09-12 22:11:01 +03:00
|
|
|
|
2024-07-08 23:41:19 +03:00
|
|
|
### Mistral ###
mistral_7b = Model(
    name="mistral-7b",
    base_provider="Mistral",
    best_provider=IterListProvider([HuggingChat, DeepInfraChat, Airforce, HuggingFace, DeepInfra])
)

mixtral_8x7b = Model(
    name="mixtral-8x7b",
    base_provider="Mistral",
    best_provider=IterListProvider([DDG, ReplicateHome, DeepInfraChat, Airforce, DeepInfra])
)

mixtral_8x22b = Model(
    name="mixtral-8x22b",
    base_provider="Mistral",
    best_provider=IterListProvider([DeepInfraChat, Airforce])
)

mistral_nemo = Model(
    name="mistral-nemo",
    base_provider="Mistral",
    best_provider=IterListProvider([HuggingChat, HuggingFace])
)
|
|
|
|
|
2024-07-08 23:41:19 +03:00
|
|
|
|
2024-09-12 22:11:01 +03:00
|
|
|
### NousResearch ###
mixtral_8x7b_dpo = Model(
    name="mixtral-8x7b-dpo",
    base_provider="NousResearch",
    best_provider=IterListProvider([Airforce])
)

hermes_3 = Model(
    name="hermes-3",
    base_provider="NousResearch",
    best_provider=IterListProvider([HuggingChat, HuggingFace])
)


### Microsoft ###
phi_3_medium_4k = Model(
    name="phi-3-medium-4k",
    base_provider="Microsoft",
    best_provider=IterListProvider([DeepInfraChat])
)

phi_3_5_mini = Model(
    name="phi-3.5-mini",
    base_provider="Microsoft",
    best_provider=IterListProvider([HuggingChat, HuggingFace])
)
|
2024-09-24 13:23:53 +03:00
|
|
|
|
|
|
|
### Google DeepMind ###
# gemini
gemini_pro = Model(
    name='gemini-pro',
    base_provider='Google DeepMind',
    best_provider=IterListProvider([GeminiPro, LiteIcoding, Blackbox, AIChatFree, Liaobots, Airforce])
)

gemini_flash = Model(
    name='gemini-flash',
    base_provider='Google DeepMind',
    best_provider=IterListProvider([Blackbox, Liaobots, Airforce])
)

# Family alias: the Gemini provider first, then the provider lists of the
# flash and pro variants defined above.
gemini = Model(
    name='gemini',
    base_provider='Google DeepMind',
    best_provider=IterListProvider([
        Gemini,
        gemini_flash.best_provider, gemini_pro.best_provider
    ])
)

# gemma
gemma_2b_9b = Model(
    name='gemma-2b-9b',
    base_provider='Google',
    best_provider=IterListProvider([Airforce])
)

gemma_2b_27b = Model(
    name='gemma-2b-27b',
    base_provider='Google',
    best_provider=IterListProvider([DeepInfraChat, Airforce])
)

# Family alias: direct providers plus the lists of the sized variants above.
gemma_2b = Model(
    name='gemma-2b',
    base_provider='Google',
    best_provider=IterListProvider([
        ReplicateHome, Airforce,
        gemma_2b_9b.best_provider, gemma_2b_27b.best_provider,
    ])
)
|
|
|
|
|
|
|
|
|
2024-07-08 23:41:19 +03:00
|
|
|
### Anthropic ###
claude_2 = Model(
    name='claude-2',
    base_provider='Anthropic',
    best_provider=IterListProvider([You])
)

claude_2_0 = Model(
    name='claude-2.0',
    base_provider='Anthropic',
    best_provider=IterListProvider([Liaobots])
)

claude_2_1 = Model(
    name='claude-2.1',
    base_provider='Anthropic',
    best_provider=IterListProvider([Liaobots])
)

# claude 3
claude_3_opus = Model(
    name='claude-3-opus',
    base_provider='Anthropic',
    best_provider=IterListProvider([Liaobots])
)

claude_3_sonnet = Model(
    name='claude-3-sonnet',
    base_provider='Anthropic',
    best_provider=IterListProvider([Liaobots])
)

claude_3_haiku = Model(
    name='claude-3-haiku',
    base_provider='Anthropic',
    best_provider=IterListProvider([DDG, Liaobots])
)

# Family alias: reuses the provider lists of opus, sonnet and haiku above.
claude_3 = Model(
    name='claude-3',
    base_provider='Anthropic',
    best_provider=IterListProvider([
        claude_3_opus.best_provider, claude_3_sonnet.best_provider, claude_3_haiku.best_provider
    ])
)

# claude 3.5
claude_3_5_sonnet = Model(
    name='claude-3.5-sonnet',
    base_provider='Anthropic',
    best_provider=IterListProvider([Blackbox, Liaobots])
)

# Family alias: LiteIcoding first, then the claude-3.5-sonnet provider list.
claude_3_5 = Model(
    name='claude-3.5',
    base_provider='Anthropic',
    best_provider=IterListProvider([
        LiteIcoding,
        claude_3_5_sonnet.best_provider
    ])
)
|
|
|
|
|
2023-09-20 06:00:19 +03:00
|
|
|
|
2024-09-24 13:23:53 +03:00
|
|
|
|
2024-07-08 23:41:19 +03:00
|
|
|
### Reka AI ###
reka_core = Model(
    name='reka-core',
    base_provider='Reka AI',
    best_provider=Reka
)


### Blackbox AI ###
blackbox = Model(
    name='blackbox',
    base_provider='Blackbox AI',
    best_provider=IterListProvider([Blackbox])
)


### Databricks ###
dbrx_instruct = Model(
    name='dbrx-instruct',
    base_provider='Databricks',
    best_provider=IterListProvider([Airforce, DeepInfra])
)


### CohereForAI ###
command_r_plus = Model(
    name='command-r-plus',
    base_provider='CohereForAI',
    best_provider=IterListProvider([HuggingChat])
)


### iFlytek ###
sparkdesk_v1_1 = Model(
    name='sparkdesk-v1.1',
    base_provider='iFlytek',
    best_provider=IterListProvider([FreeChatgpt, Airforce])
)
|
|
|
|
|
2024-09-24 13:23:53 +03:00
|
|
|
|
2024-07-25 09:21:55 +03:00
|
|
|
### Qwen ###
qwen_1_5_14b = Model(
    name='qwen-1.5-14b',
    base_provider='Qwen',
    best_provider=IterListProvider([FreeChatgpt])
)

qwen_1_5_72b = Model(
    name='qwen-1.5-72b',
    base_provider='Qwen',
    best_provider=IterListProvider([Airforce])
)

qwen_1_5_110b = Model(
    name='qwen-1.5-110b',
    base_provider='Qwen',
    best_provider=IterListProvider([Airforce])
)

qwen_2_72b = Model(
    name='qwen-2-72b',
    base_provider='Qwen',
    best_provider=IterListProvider([DeepInfraChat, HuggingChat, Airforce, HuggingFace])
)

qwen_turbo = Model(
    name='qwen-turbo',
    base_provider='Qwen',
    best_provider=IterListProvider([Bixin123])
)

# Family alias: reuses the provider lists of every Qwen variant defined above.
qwen = Model(
    name='qwen',
    base_provider='Qwen',
    best_provider=IterListProvider([
        qwen_1_5_14b.best_provider,
        qwen_1_5_72b.best_provider,
        qwen_1_5_110b.best_provider,
        qwen_2_72b.best_provider,
        qwen_turbo.best_provider
    ])
)
|
|
|
|
|
2024-07-25 09:21:55 +03:00
|
|
|
|
|
|
|
### Zhipu AI ###
glm_3_6b = Model(
    name='glm-3-6b',
    base_provider='Zhipu AI',
    best_provider=IterListProvider([FreeChatgpt])
)

# The model name is spelled with an upper-case "B" here; the lookup key in
# ModelUtils.convert is the lower-case 'glm-4-9b'.
glm_4_9b = Model(
    name='glm-4-9B',
    base_provider='Zhipu AI',
    best_provider=IterListProvider([FreeChatgpt])
)

# Family alias: reuses the provider lists of glm_3_6b and glm_4_9b above.
glm_4 = Model(
    name='glm-4',
    base_provider='Zhipu AI',
    best_provider=IterListProvider([
        glm_3_6b.best_provider, glm_4_9b.best_provider
    ])
)


### 01-ai ###
yi_1_5_9b = Model(
    name='yi-1.5-9b',
    base_provider='01-ai',
    best_provider=IterListProvider([FreeChatgpt])
)

yi_34b = Model(
    name='yi-34b',
    base_provider='01-ai',
    best_provider=IterListProvider([Airforce])
)
|
|
|
|
|
|
|
|
|
2024-09-13 17:09:31 +03:00
|
|
|
### Upstage ###
solar_1_mini = Model(
    name='solar-1-mini',
    base_provider='Upstage',
    best_provider=IterListProvider([Upstage])
)

solar_10_7b = Model(
    name='solar-10-7b',
    base_provider='Upstage',
    best_provider=Airforce
)

solar_pro = Model(
    name='solar-pro',
    base_provider='Upstage',
    best_provider=Upstage
)


### Inflection ###
pi = Model(
    name='pi',
    base_provider='Inflection',
    best_provider=Pi
)


### DeepSeek ###
deepseek = Model(
    name='deepseek',
    base_provider='DeepSeek',
    best_provider=IterListProvider([Airforce])
)


### WizardLM ###
wizardlm_2_7b = Model(
    name='wizardlm-2-7b',
    base_provider='WizardLM',
    best_provider=IterListProvider([DeepInfraChat])
)

wizardlm_2_8x22b = Model(
    name='wizardlm-2-8x22b',
    base_provider='WizardLM',
    best_provider=IterListProvider([DeepInfraChat, Airforce])
)


### Together ###
sh_n_7b = Model(
    name='sh-n-7b',
    base_provider='Together',
    best_provider=Airforce
)
|
2024-04-13 05:09:11 +03:00
|
|
|
|
2024-09-24 13:23:53 +03:00
|
|
|
|
2024-09-15 22:02:06 +03:00
|
|
|
### Yorickvp ###
llava_13b = Model(
    name='llava-13b',
    base_provider='Yorickvp',
    best_provider=ReplicateHome
)


### OpenBMB ###
minicpm_llama_3_v2_5 = Model(
    name='minicpm-llama-3-v2.5',
    base_provider='OpenBMB',
    best_provider=DeepInfraChat
)


### Lzlv ###
lzlv_70b = Model(
    name='lzlv-70b',
    base_provider='Lzlv',
    best_provider=DeepInfraChat
)


### OpenChat ###
openchat_3_6_8b = Model(
    name='openchat-3.6-8b',
    base_provider='OpenChat',
    best_provider=DeepInfraChat
)


### Phind ###
phind_codellama_34b_v2 = Model(
    name='phind-codellama-34b-v2',
    base_provider='Phind',
    best_provider=DeepInfraChat
)


### Cognitive Computations ###
dolphin_2_9_1_llama_3_70b = Model(
    name='dolphin-2.9.1-llama-3-70b',
    base_provider='Cognitive Computations',
    best_provider=DeepInfraChat
)


### x.ai ###
grok_2 = Model(
    name='grok-2',
    base_provider='x.ai',
    best_provider=Liaobots
)

grok_2_mini = Model(
    name='grok-2-mini',
    base_provider='x.ai',
    best_provider=Liaobots
)
|
|
|
|
|
|
|
|
|
|
|
|
|
2024-07-08 23:41:19 +03:00
|
|
|
#############
### Image ###
#############

### Stability AI ###
sdxl = Model(
    name='sdxl',
    base_provider='Stability AI',
    best_provider=IterListProvider([ReplicateHome, DeepInfraImage])
)

sd_3 = Model(
    name='sd-3',
    base_provider='Stability AI',
    best_provider=IterListProvider([ReplicateHome])
)


### Playground ###
playground_v2_5 = Model(
    name='playground-v2.5',
    base_provider='Playground AI',
    best_provider=IterListProvider([ReplicateHome])
)
|
|
|
|
|
2024-08-31 09:47:39 +03:00
|
|
|
### Flux AI ###
flux = Model(
    name='flux',
    base_provider='Flux AI',
    best_provider=IterListProvider([Airforce, Blackbox])
)

flux_realism = Model(
    name='flux-realism',
    base_provider='Flux AI',
    best_provider=IterListProvider([Airforce])
)

flux_anime = Model(
    name='flux-anime',
    base_provider='Flux AI',
    best_provider=IterListProvider([Airforce])
)

flux_3d = Model(
    name='flux-3d',
    base_provider='Flux AI',
    best_provider=IterListProvider([Airforce])
)

flux_disney = Model(
    name='flux-disney',
    base_provider='Flux AI',
    best_provider=IterListProvider([Airforce])
)

flux_pixel = Model(
    name='flux-pixel',
    base_provider='Flux AI',
    best_provider=IterListProvider([Airforce])
)

flux_4o = Model(
    name='flux-4o',
    base_provider='Flux AI',
    best_provider=IterListProvider([Airforce])
)

flux_schnell = Model(
    name='flux-schnell',
    base_provider='Flux AI',
    best_provider=IterListProvider([ReplicateHome])
)
|
|
|
|
|
2024-09-24 13:23:53 +03:00
|
|
|
|
2024-09-04 22:23:17 +03:00
|
|
|
### ###
# The section header is blank in the source and base_provider is left as an
# empty string for every model in this group.
dalle_2 = Model(
    name='dalle-2',
    base_provider='',
    best_provider=IterListProvider([Nexra])
)

dalle_3 = Model(
    name='dalle-3',
    base_provider='',
    best_provider=IterListProvider([Airforce])
)

# Family alias: Nexra first, then the provider lists of dalle_2 and dalle_3
# defined above.
dalle = Model(
    name='dalle',
    base_provider='',
    best_provider=IterListProvider([
        Nexra,
        dalle_2.best_provider, dalle_3.best_provider,
    ])
)

dalle_mini = Model(
    name='dalle-mini',
    base_provider='',
    best_provider=IterListProvider([Nexra])
)


### ###
emi = Model(
    name='emi',
    base_provider='',
    best_provider=IterListProvider([Nexra])
)

any_dark = Model(
    name='any-dark',
    base_provider='',
    best_provider=IterListProvider([Airforce])
)
|
|
|
|
|
2023-09-18 00:23:54 +03:00
|
|
|
class ModelUtils:
    """
    Utility class for mapping string identifiers to Model instances.

    The keys are the identifiers callers look models up by. They usually equal
    ``Model.name`` but not always (e.g. ``'gigachat'`` maps to the model named
    ``'GigaChat:latest'``, ``'command-r+'`` to ``'command-r-plus'`` and
    ``'glm-4-9b'`` to ``'glm-4-9B'``).

    Insertion order is meaningful: the module-level ``_all_models`` list is
    built from these keys in order.

    Attributes:
        convert (dict[str, Model]): Dictionary mapping model string identifiers to Model instances.
    """
    convert: dict[str, Model] = {

        ############
        ### Text ###
        ############

        ### OpenAI ###
        # gpt-3
        'gpt-3': gpt_3,

        # gpt-3.5
        'gpt-3.5-turbo': gpt_35_turbo,

        # gpt-4
        'gpt-4o': gpt_4o,
        'gpt-4o-mini': gpt_4o_mini,
        'gpt-4': gpt_4,
        'gpt-4-turbo': gpt_4_turbo,


        ### Meta ###
        "meta-ai": meta,

        # llama-2
        'llama-2-13b': llama_2_13b,

        # llama-3
        'llama-3': llama_3,
        'llama-3-8b': llama_3_8b,
        'llama-3-70b': llama_3_70b,

        # llama-3.1
        'llama-3.1': llama_3_1,
        'llama-3.1-8b': llama_3_1_8b,
        'llama-3.1-70b': llama_3_1_70b,
        'llama-3.1-405b': llama_3_1_405b,


        ### Mistral ###
        'mistral-7b': mistral_7b,
        'mixtral-8x7b': mixtral_8x7b,
        'mixtral-8x22b': mixtral_8x22b,
        'mistral-nemo': mistral_nemo,


        ### NousResearch ###
        'mixtral-8x7b-dpo': mixtral_8x7b_dpo,
        'hermes-3': hermes_3,

        # 01-ai model; kept at this position so the key order is unchanged.
        'yi-34b': yi_34b,


        ### Microsoft ###
        # Legacy key with mixed "_" / "-" separators, kept so existing callers
        # keep working; the correctly hyphenated key follows it.
        'phi_3_medium-4k': phi_3_medium_4k,
        'phi-3-medium-4k': phi_3_medium_4k,
        'phi-3.5-mini': phi_3_5_mini,


        ### Google ###
        # gemini
        'gemini': gemini,
        'gemini-pro': gemini_pro,
        'gemini-flash': gemini_flash,

        # gemma
        'gemma-2b': gemma_2b,
        'gemma-2b-9b': gemma_2b_9b,
        'gemma-2b-27b': gemma_2b_27b,


        ### Anthropic ###
        'claude-2': claude_2,
        'claude-2.0': claude_2_0,
        'claude-2.1': claude_2_1,

        # claude 3
        'claude-3': claude_3,
        'claude-3-opus': claude_3_opus,
        'claude-3-sonnet': claude_3_sonnet,
        'claude-3-haiku': claude_3_haiku,

        # claude 3.5
        'claude-3.5': claude_3_5,
        'claude-3.5-sonnet': claude_3_5_sonnet,


        ### Reka AI ###
        'reka-core': reka_core,


        ### Blackbox AI ###
        'blackbox': blackbox,


        ### CohereForAI ###
        'command-r+': command_r_plus,


        ### Databricks ###
        'dbrx-instruct': dbrx_instruct,


        ### GigaChat ###
        'gigachat': gigachat,


        ### iFlytek ###
        'sparkdesk-v1.1': sparkdesk_v1_1,


        ### Qwen ###
        'qwen': qwen,
        'qwen-1.5-14b': qwen_1_5_14b,
        'qwen-1.5-72b': qwen_1_5_72b,
        'qwen-1.5-110b': qwen_1_5_110b,
        'qwen-2-72b': qwen_2_72b,
        'qwen-turbo': qwen_turbo,


        ### Zhipu AI ###
        'glm-3-6b': glm_3_6b,
        'glm-4-9b': glm_4_9b,
        'glm-4': glm_4,


        ### 01-ai ###
        'yi-1.5-9b': yi_1_5_9b,


        ### Upstage ###
        'solar-1-mini': solar_1_mini,
        'solar-10-7b': solar_10_7b,
        'solar-pro': solar_pro,


        ### Inflection ###
        'pi': pi,

        ### DeepSeek ###
        'deepseek': deepseek,


        ### Together ###
        'sh-n-7b': sh_n_7b,


        ### Yorickvp ###
        'llava-13b': llava_13b,


        ### WizardLM ###
        'wizardlm-2-7b': wizardlm_2_7b,
        'wizardlm-2-8x22b': wizardlm_2_8x22b,


        ### OpenBMB ###
        'minicpm-llama-3-v2.5': minicpm_llama_3_v2_5,


        ### Lzlv ###
        'lzlv-70b': lzlv_70b,


        ### OpenChat ###
        'openchat-3.6-8b': openchat_3_6_8b,


        ### Phind ###
        'phind-codellama-34b-v2': phind_codellama_34b_v2,


        ### Cognitive Computations ###
        'dolphin-2.9.1-llama-3-70b': dolphin_2_9_1_llama_3_70b,


        ### x.ai ###
        'grok-2': grok_2,
        'grok-2-mini': grok_2_mini,



        #############
        ### Image ###
        #############

        ### Stability AI ###
        'sdxl': sdxl,
        'sd-3': sd_3,


        ### Playground ###
        'playground-v2.5': playground_v2_5,


        ### Flux AI ###
        'flux': flux,
        'flux-realism': flux_realism,
        'flux-anime': flux_anime,
        'flux-3d': flux_3d,
        'flux-disney': flux_disney,
        'flux-pixel': flux_pixel,
        'flux-4o': flux_4o,
        'flux-schnell': flux_schnell,


        ### ###
        'dalle': dalle,
        'dalle-2': dalle_2,
        'dalle-3': dalle_3,
        'dalle-mini': dalle_mini,
        'emi': emi,
        'any-dark': any_dark,
    }
|
2023-10-19 17:14:48 +03:00
|
|
|
|
2024-02-04 21:50:32 +03:00
|
|
|
# Every registered model identifier, in registry order; this is the list that
# Model.__all__() returns. Iterating a dict yields its keys.
_all_models = list(ModelUtils.convert)
|