2023-09-30 22:27:21 -04:00
|
|
|
from __future__ import annotations
|
2024-02-21 18:16:58 -05:00
|
|
|
|
2023-09-17 17:23:54 -04:00
|
|
|
from dataclasses import dataclass
|
2024-02-21 18:16:58 -05:00
|
|
|
|
2024-01-01 11:48:57 -05:00
|
|
|
from .Provider import RetryProvider, ProviderType
|
2023-09-30 22:27:21 -04:00
|
|
|
from .Provider import (
|
2023-11-16 10:56:23 -05:00
|
|
|
Chatgpt4Online,
|
2024-01-22 23:02:14 -05:00
|
|
|
PerplexityLabs,
|
2023-11-17 22:38:31 -05:00
|
|
|
ChatgptDemoAi,
|
2024-01-13 10:18:31 -05:00
|
|
|
GeminiProChat,
|
2023-11-17 22:38:31 -05:00
|
|
|
ChatgptNext,
|
2023-12-06 03:35:36 -05:00
|
|
|
HuggingChat,
|
2023-12-24 19:38:42 -05:00
|
|
|
ChatgptDemo,
|
2024-01-10 04:34:56 -05:00
|
|
|
FreeChatgpt,
|
2023-10-13 18:31:48 -04:00
|
|
|
GptForLove,
|
2023-09-30 22:27:21 -04:00
|
|
|
ChatgptAi,
|
2023-10-26 15:32:49 -04:00
|
|
|
DeepInfra,
|
2023-10-21 19:22:25 -04:00
|
|
|
ChatBase,
|
2023-11-17 22:38:31 -05:00
|
|
|
Liaobots,
|
2023-10-01 20:04:22 -04:00
|
|
|
FreeGpt,
|
2023-10-26 15:32:49 -04:00
|
|
|
Llama2,
|
2024-02-09 08:24:15 -05:00
|
|
|
Vercel,
|
|
|
|
Gemini,
|
2023-09-30 22:27:21 -04:00
|
|
|
GptGo,
|
2023-12-24 19:38:42 -05:00
|
|
|
Gpt6,
|
2023-09-30 22:27:21 -04:00
|
|
|
Bing,
|
2023-10-04 23:13:37 -04:00
|
|
|
You,
|
2023-12-01 17:56:12 -05:00
|
|
|
Pi,
|
2023-09-17 17:37:14 -04:00
|
|
|
)
|
2023-09-17 17:23:54 -04:00
|
|
|
|
2023-09-20 00:12:34 -04:00
|
|
|
@dataclass(unsafe_hash=True)
class Model:
    """
    Represents a machine learning model configuration.

    ``unsafe_hash=True`` makes the dataclass generate ``__hash__`` from its
    fields even though instances stay mutable, so equal models hash equally.

    Attributes:
        name (str): Name of the model.
        base_provider (str): Default provider for the model.
        best_provider (ProviderType | None): The preferred provider for the
            model, typically with retry logic. ``None`` when none is given.
    """
    name: str
    base_provider: str
    # The default is None, so the annotation must admit None. The module's
    # ``from __future__ import annotations`` keeps this expression lazy.
    best_provider: ProviderType | None = None

    @staticmethod
    def __all__() -> list[str]:
        """Returns a list of all model names.

        The module-level ``_all_models`` list is returned as-is (the same
        list object on every call, not a copy).
        """
        return _all_models
|
2023-09-17 17:23:54 -04:00
|
|
|
|
|
|
|
# Model entry with an empty name and empty base provider; its provider is a
# RetryProvider built over the list below (order preserved).
default = Model(
    name="",
    base_provider="",
    best_provider=RetryProvider(
        [
            Bing,
            ChatgptAi,
            GptGo,
            You,
            Chatgpt4Online,
        ]
    ),
)
|
|
|
|
|
2023-11-16 10:56:23 -05:00
|
|
|
# Also GPT-3.5, but every provider listed here supports long requests and
# long responses.
gpt_35_long = Model(
    name="gpt-3.5-turbo",
    base_provider="openai",
    best_provider=RetryProvider(
        [
            FreeGpt,
            You,
            Chatgpt4Online,
            ChatgptDemoAi,
            ChatgptNext,
            ChatgptDemo,
            Gpt6,
        ]
    ),
)
|
2023-09-17 17:23:54 -04:00
|
|
|
|
|
|
|
# GPT-3.5 / GPT-4
# Standard gpt-3.5-turbo entry (shares its model name with gpt_35_long but
# uses a different provider list).
gpt_35_turbo = Model(
    name="gpt-3.5-turbo",
    base_provider="openai",
    best_provider=RetryProvider(
        [
            GptGo,
            You,
            GptForLove,
            ChatBase,
            Chatgpt4Online,
        ]
    ),
)
|
|
|
|
|
|
|
|
# gpt-4 entry; its provider object is reused by the gpt-4 variants below.
gpt_4 = Model(
    name="gpt-4",
    base_provider="openai",
    best_provider=RetryProvider(
        [
            Bing,
            Liaobots,
        ]
    ),
)
|
2023-09-17 17:23:54 -04:00
|
|
|
|
2023-12-20 19:03:28 -05:00
|
|
|
# gpt-4-turbo entry, bound to the single Bing provider (no RetryProvider).
gpt_4_turbo = Model(
    name="gpt-4-turbo",
    base_provider="openai",
    best_provider=Bing,
)
|
|
|
|
|
2023-10-26 15:32:49 -04:00
|
|
|
# Llama 2 chat model, 7B variant.
llama2_7b = Model(
    name="meta-llama/Llama-2-7b-chat-hf",
    base_provider="huggingface",
    best_provider=RetryProvider(
        [
            Llama2,
            DeepInfra,
        ]
    ),
)
|
2023-10-26 15:32:49 -04:00
|
|
|
|
|
|
|
# Llama 2 chat model, 13B variant.
llama2_13b = Model(
    name="meta-llama/Llama-2-13b-chat-hf",
    base_provider="huggingface",
    best_provider=RetryProvider(
        [
            Llama2,
            DeepInfra,
        ]
    ),
)
|
2023-10-26 15:32:49 -04:00
|
|
|
|
|
|
|
# Llama 2 chat model, 70B variant.
llama2_70b = Model(
    name="meta-llama/Llama-2-70b-chat-hf",
    base_provider="huggingface",
    best_provider=RetryProvider(
        [
            Llama2,
            DeepInfra,
            HuggingChat,
            PerplexityLabs,
        ]
    ),
)
|
|
|
|
|
|
|
|
# CodeLlama instruct model, 34B variant.
codellama_34b_instruct = Model(
    name="codellama/CodeLlama-34b-Instruct-hf",
    base_provider="huggingface",
    best_provider=RetryProvider(
        [
            HuggingChat,
            PerplexityLabs,
            DeepInfra,
        ]
    ),
)
|
2023-10-26 15:32:49 -04:00
|
|
|
|
2024-02-04 13:50:32 -05:00
|
|
|
# CodeLlama instruct model, 70B variant; bound to DeepInfra only.
codellama_70b_instruct = Model(
    name="codellama/CodeLlama-70b-Instruct-hf",
    base_provider="huggingface",
    best_provider=DeepInfra,
)
|
|
|
|
|
2024-01-23 05:35:37 -05:00
|
|
|
# Mistral
mixtral_8x7b = Model(
    name="mistralai/Mixtral-8x7B-Instruct-v0.1",
    base_provider="huggingface",
    best_provider=RetryProvider(
        [
            DeepInfra,
            HuggingChat,
            PerplexityLabs,
        ]
    ),
)
|
2023-12-13 07:15:27 -05:00
|
|
|
|
|
|
|
# Mistral 7B instruct entry; same provider list as mixtral_8x7b, but a
# separately constructed RetryProvider.
mistral_7b = Model(
    name="mistralai/Mistral-7B-Instruct-v0.1",
    base_provider="huggingface",
    best_provider=RetryProvider(
        [
            DeepInfra,
            HuggingChat,
            PerplexityLabs,
        ]
    ),
)
|
|
|
|
|
2024-01-23 05:35:37 -05:00
|
|
|
# Misc models
dolphin_mixtral_8x7b = Model(
    name="cognitivecomputations/dolphin-2.6-mixtral-8x7b",
    base_provider="huggingface",
    best_provider=DeepInfra,
)
|
|
|
|
|
2024-01-23 05:35:37 -05:00
|
|
|
# lzlv 70B entry; bound to DeepInfra only.
lzlv_70b = Model(
    name="lizpreciatior/lzlv_70b_fp16_hf",
    base_provider="huggingface",
    best_provider=DeepInfra,
)
|
|
|
|
|
|
|
|
# Airoboros 70B entry; bound to DeepInfra only.
airoboros_70b = Model(
    name="deepinfra/airoboros-70b",
    base_provider="huggingface",
    best_provider=DeepInfra,
)
|
|
|
|
|
|
|
|
# Airoboros L2 70B entry; bound to DeepInfra only.
airoboros_l2_70b = Model(
    name="jondurbin/airoboros-l2-70b-gpt4-1.4.1",
    base_provider="huggingface",
    best_provider=DeepInfra,
)
|
|
|
|
|
2024-01-01 11:48:57 -05:00
|
|
|
# OpenChat 3.5 entry.
openchat_35 = Model(
    name="openchat/openchat_3.5",
    base_provider="huggingface",
    best_provider=RetryProvider(
        [
            DeepInfra,
            HuggingChat,
        ]
    ),
)
|
2023-12-13 07:15:27 -05:00
|
|
|
|
2023-09-17 17:23:54 -04:00
|
|
|
# Bard
# `bard` and `palm` are aliases: the chained assignment binds all three names
# to the same Model instance.
gemini = bard = palm = Model(
    name="gemini",
    base_provider="google",
    best_provider=Gemini,
)
|
2023-09-17 17:23:54 -04:00
|
|
|
|
|
|
|
# Claude v2 entry.
claude_v2 = Model(
    name="claude-v2",
    base_provider="anthropic",
    best_provider=RetryProvider(
        [
            FreeChatgpt,
            Vercel,
        ]
    ),
)
|
2023-09-17 17:23:54 -04:00
|
|
|
|
|
|
|
# 16k variant: reuses the provider object of gpt_35_long (same instance,
# not a copy).
gpt_35_turbo_16k = Model(
    name="gpt-3.5-turbo-16k",
    base_provider="openai",
    best_provider=gpt_35_long.best_provider,
)
|
2023-09-19 23:00:19 -04:00
|
|
|
|
2023-09-17 17:23:54 -04:00
|
|
|
# 16k-0613 variant: reuses the provider object of gpt_35_long (same
# instance, not a copy).
gpt_35_turbo_16k_0613 = Model(
    name="gpt-3.5-turbo-16k-0613",
    base_provider="openai",
    best_provider=gpt_35_long.best_provider,
)
|
2023-09-22 15:36:44 -04:00
|
|
|
|
|
|
|
# 0613 variant: reuses the provider object of gpt_35_turbo (same instance,
# not a copy).
gpt_35_turbo_0613 = Model(
    name="gpt-3.5-turbo-0613",
    base_provider="openai",
    best_provider=gpt_35_turbo.best_provider,
)
|
2023-09-17 17:23:54 -04:00
|
|
|
|
|
|
|
# gpt-4-0613: reuses the provider object of gpt_4 (same instance, not a copy).
gpt_4_0613 = Model(
    name="gpt-4-0613",
    base_provider="openai",
    best_provider=gpt_4.best_provider,
)
|
2023-09-29 10:21:18 -04:00
|
|
|
|
|
|
|
# gpt-4-32k: reuses the provider object of gpt_4 (same instance, not a copy).
gpt_4_32k = Model(
    name="gpt-4-32k",
    base_provider="openai",
    best_provider=gpt_4.best_provider,
)
|
2023-09-29 10:21:18 -04:00
|
|
|
|
|
|
|
# gpt-4-32k-0613: reuses the provider object of gpt_4 (same instance, not a
# copy).
gpt_4_32k_0613 = Model(
    name="gpt-4-32k-0613",
    base_provider="openai",
    best_provider=gpt_4.best_provider,
)
|
2023-09-17 17:23:54 -04:00
|
|
|
|
2024-01-13 09:58:12 -05:00
|
|
|
# Gemini Pro entry.
gemini_pro = Model(
    name="gemini-pro",
    base_provider="google",
    best_provider=RetryProvider(
        [
            FreeChatgpt,
            GeminiProChat,
        ]
    ),
)
|
|
|
|
|
2023-12-01 17:11:52 -05:00
|
|
|
# Pi entry; bound to the single Pi provider.
pi = Model(
    name="pi",
    base_provider="inflection",
    best_provider=Pi,
)
|
2023-09-17 17:23:54 -04:00
|
|
|
|
|
|
|
class ModelUtils:
    """
    Utility class for mapping string identifiers to Model instances.

    Attributes:
        convert (dict[str, Model]): Lookup table from a model's string
            identifier to the module-level Model object defined above.
            Insertion order is significant: the module builds its list of
            all model names from this dict's keys.
    """
    convert: dict[str, Model] = {
        # gpt-3.5
        "gpt-3.5-turbo": gpt_35_turbo,
        "gpt-3.5-turbo-0613": gpt_35_turbo_0613,
        "gpt-3.5-turbo-16k": gpt_35_turbo_16k,
        "gpt-3.5-turbo-16k-0613": gpt_35_turbo_16k_0613,

        "gpt-3.5-long": gpt_35_long,

        # gpt-4
        "gpt-4": gpt_4,
        "gpt-4-0613": gpt_4_0613,
        "gpt-4-32k": gpt_4_32k,
        "gpt-4-32k-0613": gpt_4_32k_0613,
        "gpt-4-turbo": gpt_4_turbo,

        # Llama 2
        "llama2-7b": llama2_7b,
        "llama2-13b": llama2_13b,
        "llama2-70b": llama2_70b,
        "codellama-34b-instruct": codellama_34b_instruct,
        "codellama-70b-instruct": codellama_70b_instruct,

        "mixtral-8x7b": mixtral_8x7b,
        "mistral-7b": mistral_7b,
        "dolphin-mixtral-8x7b": dolphin_mixtral_8x7b,
        "lzlv-70b": lzlv_70b,
        "airoboros-70b": airoboros_70b,
        "airoboros-l2-70b": airoboros_l2_70b,
        "openchat_3.5": openchat_35,
        "gemini": gemini,
        "gemini-pro": gemini_pro,
        "claude-v2": claude_v2,
        "pi": pi,
    }
|
2023-10-19 10:14:48 -04:00
|
|
|
|
2024-02-04 13:50:32 -05:00
|
|
|
# Every identifier registered in ModelUtils.convert, in insertion order.
# Model.__all__() returns this list.
_all_models = list(ModelUtils.convert)
|