from __future__ import annotations

import json
import re
from typing import List

from aiohttp import ClientSession

from ...typing import AsyncResult, Messages
from ..base_provider import AsyncGeneratorProvider, ProviderModelMixin


def clean_response(text: str) -> str:
    """Strip unwanted service messages and artifacts from the response."""
    patterns = [
        r"One message exceeds the \d+chars per message limit\..+https:\/\/discord\.com\/invite\/\S+",
        r"Rate limit \(\d+\/minute\) exceeded\. Join our discord for more: .+https:\/\/discord\.com\/invite\/\S+",
        r"Rate limit \(\d+\/hour\) exceeded\. Join our discord for more: https:\/\/discord\.com\/invite\/\S+",
        r"</s>",  # zephyr-7b-beta
    ]

    for pattern in patterns:
        text = re.sub(pattern, '', text)
    return text.strip()

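# A quick illustration (hypothetical strings, not captured from the live API):
#   clean_response("Hi there</s>")        # -> "Hi there"
#   clean_response("  padded answer  ")   # -> "padded answer"
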
def split_message(message: dict, chunk_size: int = 995) -> List[dict]:
    """Split a message into chunks of the specified size."""
    content = message.get('content', '')
    if len(content) <= chunk_size:
        return [message]

    chunks = []
    while content:
        chunk = content[:chunk_size]
        content = content[chunk_size:]
        chunks.append({
            'role': message['role'],
            'content': chunk
        })
    return chunks

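# For example (hypothetical input), a 2000-character user message becomes
# three chunks of 995, 995, and 10 characters, each keeping the original role:
#   split_message({"role": "user", "content": "x" * 2000})
#   -> [{'role': 'user', 'content': 'xx...x'},   # 995 chars
#       {'role': 'user', 'content': 'xx...x'},   # 995 chars
#       {'role': 'user', 'content': 'xxxxxxxxxx'}]  # 10 chars
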
def split_messages(messages: Messages, chunk_size: int = 995) -> Messages:
    """Split all messages that exceed chunk_size into smaller messages."""
    result = []
    for message in messages:
        result.extend(split_message(message, chunk_size))
    return result


class AirforceChat(AsyncGeneratorProvider, ProviderModelMixin):
    label = "AirForce Chat"
    api_endpoint_completions = "https://api.airforce/chat/completions"  # Replace with the real endpoint
    supports_stream = True
    supports_system_message = True
    supports_message_history = True

    default_model = 'llama-3-70b-chat'
    text_models = [
        # anthropic
        'claude-3-haiku-20240307',
        'claude-3-sonnet-20240229',
        'claude-3-5-sonnet-20240620',
        'claude-3-5-sonnet-20241022',
        'claude-3-opus-20240229',

        # openai
        'chatgpt-4o-latest',
        'gpt-4',
        'gpt-4-turbo',
        'gpt-4o-2024-05-13',
        'gpt-4o-mini-2024-07-18',
        'gpt-4o-mini',
        'gpt-4o-2024-08-06',
        'gpt-3.5-turbo',
        'gpt-3.5-turbo-0125',
        'gpt-3.5-turbo-1106',
        'gpt-4o',
        'gpt-4-turbo-2024-04-09',
        'gpt-4-0125-preview',
        'gpt-4-1106-preview',

        # meta-llama
        default_model,
        'llama-3-70b-chat-turbo',
        'llama-3-8b-chat',
        'llama-3-8b-chat-turbo',
        'llama-3-70b-chat-lite',
        'llama-3-8b-chat-lite',
        'llama-2-13b-chat',
        'llama-3.1-405b-turbo',
        'llama-3.1-70b-turbo',
        'llama-3.1-8b-turbo',
        'LlamaGuard-2-8b',
        'llamaguard-7b',
        'Llama-Vision-Free',
        'Llama-Guard-7b',
        'Llama-3.2-90B-Vision-Instruct-Turbo',
        'Meta-Llama-Guard-3-8B',
        'Llama-3.2-11B-Vision-Instruct-Turbo',
        'Llama-Guard-3-11B-Vision-Turbo',
        'Llama-3.2-3B-Instruct-Turbo',
        'Llama-3.2-1B-Instruct-Turbo',
        'llama-2-7b-chat-int8',
        'llama-2-7b-chat-fp16',
        'Llama 3.1 405B Instruct',
        'Llama 3.1 70B Instruct',
        'Llama 3.1 8B Instruct',

        # mistral-ai
        'Mixtral-8x7B-Instruct-v0.1',
        'Mixtral-8x22B-Instruct-v0.1',
        'Mistral-7B-Instruct-v0.1',
        'Mistral-7B-Instruct-v0.2',
        'Mistral-7B-Instruct-v0.3',

        # Gryphe
        'MythoMax-L2-13b-Lite',
        'MythoMax-L2-13b',

        # openchat
        'openchat-3.5-0106',

        # qwen
        #'Qwen1.5-72B-Chat',  # Empty response
        #'Qwen1.5-110B-Chat',  # Empty response
        'Qwen2-72B-Instruct',
        'Qwen2.5-7B-Instruct-Turbo',
        'Qwen2.5-72B-Instruct-Turbo',

        # google
        'gemma-2b-it',
        'gemma-2-9b-it',
        'gemma-2-27b-it',

        # gemini
        'gemini-1.5-flash',
        'gemini-1.5-pro',

        # databricks
        'dbrx-instruct',

        # deepseek-ai
        'deepseek-coder-6.7b-base',
        'deepseek-coder-6.7b-instruct',
        'deepseek-math-7b-instruct',

        # NousResearch
        'Nous-Hermes-2-Mixtral-8x7B-DPO',
        'hermes-2-pro-mistral-7b',

        # teknium
        'openhermes-2.5-mistral-7b',

        # microsoft
        'WizardLM-2-8x22B',
        'phi-2',

        # upstage
        'SOLAR-10.7B-Instruct-v1.0',

        # pawan
        'cosmosrp',

        # liquid
        'lfm-40b-moe',

        # DiscoResearch
        'discolm-german-7b-v1',

        # tiiuae
        'falcon-7b-instruct',

        # defog
        'sqlcoder-7b-2',

        # tinyllama
        'tinyllama-1.1b-chat',

        # HuggingFaceH4
        'zephyr-7b-beta',
    ]

    models = [*text_models]

    model_aliases = {
        # anthropic
        "claude-3-haiku": "claude-3-haiku-20240307",
        "claude-3-sonnet": "claude-3-sonnet-20240229",
        #"claude-3.5-sonnet": "claude-3-5-sonnet-20240620", # shadowed by a later duplicate key
        "claude-3.5-sonnet": "claude-3-5-sonnet-20241022",
        "claude-3-opus": "claude-3-opus-20240229",

        # openai
        #"gpt-4o": "chatgpt-4o-latest", # shadowed by a later duplicate key
        #"gpt-4": "gpt-4",
        #"gpt-4-turbo": "gpt-4-turbo",
        #"gpt-4o": "gpt-4o-2024-05-13", # shadowed by a later duplicate key
        "gpt-4o-mini": "gpt-4o-mini-2024-07-18",
        #"gpt-4o-mini": "gpt-4o-mini",
        "gpt-4o": "gpt-4o-2024-08-06",
        #"gpt-3.5-turbo": "gpt-3.5-turbo", # shadowed by a later duplicate key
        #"gpt-3.5-turbo": "gpt-3.5-turbo-0125", # shadowed by a later duplicate key
        "gpt-3.5-turbo": "gpt-3.5-turbo-1106",
        #"gpt-4o": "gpt-4o",
        "gpt-4-turbo": "gpt-4-turbo-2024-04-09",
        #"gpt-4": "gpt-4-0125-preview", # shadowed by a later duplicate key
        "gpt-4": "gpt-4-1106-preview",

        # meta-llama
        #"llama-3-70b": "llama-3-70b-chat", # shadowed by a later duplicate key
        #"llama-3-8b": "llama-3-8b-chat", # shadowed by a later duplicate key
        #"llama-3-8b": "llama-3-8b-chat-turbo", # shadowed by a later duplicate key
        "llama-3-70b": "llama-3-70b-chat-lite",
        "llama-3-8b": "llama-3-8b-chat-lite",
        "llama-2-13b": "llama-2-13b-chat",
        #"llama-3.1-405b": "llama-3.1-405b-turbo", # shadowed by a later duplicate key
        #"llama-3.1-70b": "llama-3.1-70b-turbo", # shadowed by a later duplicate key
        #"llama-3.1-8b": "llama-3.1-8b-turbo", # shadowed by a later duplicate key
        "llamaguard-2-8b": "LlamaGuard-2-8b",
        #"llamaguard-7b": "llamaguard-7b", # shadowed by a later duplicate key
        #"llama_vision_free": "Llama-Vision-Free", # Unknown
        "llamaguard-7b": "Llama-Guard-7b",
        "llama-3.2-90b": "Llama-3.2-90B-Vision-Instruct-Turbo",
        "llamaguard-3-8b": "Meta-Llama-Guard-3-8B",
        "llama-3.2-11b": "Llama-3.2-11B-Vision-Instruct-Turbo",
        "llamaguard-3-11b": "Llama-Guard-3-11B-Vision-Turbo",
        "llama-3.2-3b": "Llama-3.2-3B-Instruct-Turbo",
        "llama-3.2-1b": "Llama-3.2-1B-Instruct-Turbo",
        #"llama-2-7b": "llama-2-7b-chat-int8", # shadowed by a later duplicate key
        "llama-2-7b": "llama-2-7b-chat-fp16",
        "llama-3.1-405b": "Llama 3.1 405B Instruct",
        "llama-3.1-70b": "Llama 3.1 70B Instruct",
        "llama-3.1-8b": "Llama 3.1 8B Instruct",

        # mistral-ai
        "mixtral-8x7b": "Mixtral-8x7B-Instruct-v0.1",
        "mixtral-8x22b": "Mixtral-8x22B-Instruct-v0.1",
        #"mistral-7b": "Mistral-7B-Instruct-v0.1", # shadowed by a later duplicate key
        #"mistral-7b": "Mistral-7B-Instruct-v0.2", # shadowed by a later duplicate key
        "mistral-7b": "Mistral-7B-Instruct-v0.3",

        # Gryphe
        #"mythomax-13b": "MythoMax-L2-13b-Lite", # shadowed by a later duplicate key
        "mythomax-13b": "MythoMax-L2-13b",

        # openchat
        "openchat-3.5": "openchat-3.5-0106",

        # qwen
        #"qwen-1.5-72b": "Qwen1.5-72B-Chat", # Empty response
        #"qwen-1.5-110b": "Qwen1.5-110B-Chat", # Empty response
        "qwen-2-72b": "Qwen2-72B-Instruct",
        "qwen-2-5-7b": "Qwen2.5-7B-Instruct-Turbo",
        "qwen-2-5-72b": "Qwen2.5-72B-Instruct-Turbo",

        # google
        "gemma-2b": "gemma-2b-it",
        "gemma-2-9b": "gemma-2-9b-it",
        "gemma-2-27b": "gemma-2-27b-it",

        # gemini
        "gemini-flash": "gemini-1.5-flash",
        "gemini-pro": "gemini-1.5-pro",

        # databricks
        "dbrx-instruct": "dbrx-instruct",

        # deepseek-ai
        #"deepseek-coder": "deepseek-coder-6.7b-base",
        "deepseek-coder": "deepseek-coder-6.7b-instruct",
        #"deepseek-math": "deepseek-math-7b-instruct",

        # NousResearch
        "hermes-2-dpo": "Nous-Hermes-2-Mixtral-8x7B-DPO",
        "hermes-2": "hermes-2-pro-mistral-7b",

        # teknium
        "openhermes-2.5": "openhermes-2.5-mistral-7b",

        # microsoft
        "wizardlm-2-8x22b": "WizardLM-2-8x22B",
        #"phi-2": "phi-2",

        # upstage
        "solar-10-7b": "SOLAR-10.7B-Instruct-v1.0",

        # pawan
        #"cosmosrp": "cosmosrp",

        # liquid
        "lfm-40b": "lfm-40b-moe",

        # DiscoResearch
        "german-7b": "discolm-german-7b-v1",

        # tiiuae
        #"falcon-7b": "falcon-7b-instruct",

        # defog
        #"sqlcoder-7b": "sqlcoder-7b-2",

        # tinyllama
        #"tinyllama-1b": "tinyllama-1.1b-chat",

        # HuggingFaceH4
        "zephyr-7b": "zephyr-7b-beta",
    }

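    # get_model (provided by ProviderModelMixin) is expected to resolve these
    # aliases, so e.g. a request for "gpt-4o" is forwarded upstream as
    # "gpt-4o-2024-08-06" under the mapping above.
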
    @classmethod
    async def create_async_generator(
        cls,
        model: str,
        messages: Messages,
        stream: bool = False,
        proxy: str = None,
        max_tokens: int = 4096,
        temperature: float = 1,
        top_p: float = 1,
        **kwargs
    ) -> AsyncResult:
        model = cls.get_model(model)

        chunked_messages = split_messages(messages)

        headers = {
            'accept': '*/*',
            'accept-language': 'en-US,en;q=0.9',
            'authorization': 'Bearer missing api key',
            'cache-control': 'no-cache',
            'content-type': 'application/json',
            'origin': 'https://llmplayground.net',
            'pragma': 'no-cache',
            'priority': 'u=1, i',
            'referer': 'https://llmplayground.net/',
            'sec-ch-ua': '"Not?A_Brand";v="99", "Chromium";v="130"',
            'sec-ch-ua-mobile': '?0',
            'sec-ch-ua-platform': '"Linux"',
            'sec-fetch-dest': 'empty',
            'sec-fetch-mode': 'cors',
            'sec-fetch-site': 'cross-site',
            'user-agent': 'Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/130.0.0.0 Safari/537.36'
        }

        data = {
            "messages": chunked_messages,
            "model": model,
            "max_tokens": max_tokens,
            "temperature": temperature,
            "top_p": top_p,
            "stream": stream
        }

        async with ClientSession(headers=headers) as session:
            async with session.post(cls.api_endpoint_completions, json=data, proxy=proxy) as response:
                response.raise_for_status()
                text = ""
                if stream:
                    async for line in response.content:
                        line = line.decode('utf-8')
                        if line.startswith('data: '):
                            # The SSE terminator also arrives as "data: [DONE]",
                            # so check for it before attempting to parse JSON.
                            json_str = line[6:].strip()
                            if json_str == "[DONE]":
                                break
                            try:
                                chunk = json.loads(json_str)
                                if 'choices' in chunk and chunk['choices']:
                                    content = chunk['choices'][0].get('delta', {}).get('content', '')
                                    text += content  # Accumulate the streamed deltas
                            except json.JSONDecodeError as e:
                                print(f"Error decoding JSON: {json_str}, Error: {e}")
                    yield clean_response(text)
                else:
                    response_json = await response.json()
                    text = response_json["choices"][0]["message"]["content"]
                    yield clean_response(text)

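# A minimal usage sketch (illustrative only; in practice the g4f client picks
# and drives providers, so you rarely call a provider class directly):
#
#     import asyncio
#
#     async def main():
#         messages = [{"role": "user", "content": "Hello!"}]
#         async for text in AirforceChat.create_async_generator("gpt-4o", messages):
#             print(text)
#
#     asyncio.run(main())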