feat(g4f/Provider/HuggingChat.py): update model list and aliases

This commit is contained in:
kqlio67 2024-09-25 20:05:39 +03:00
parent ec4e25073b
commit 1e62a9dd60
2 changed files with 27 additions and 14 deletions

View file

@@ -18,9 +18,9 @@ class HuggingChat(AbstractProvider, ProviderModelMixin):
'CohereForAI/c4ai-command-r-plus-08-2024', 'CohereForAI/c4ai-command-r-plus-08-2024',
'Qwen/Qwen2.5-72B-Instruct', 'Qwen/Qwen2.5-72B-Instruct',
'mistralai/Mixtral-8x7B-Instruct-v0.1', 'mistralai/Mixtral-8x7B-Instruct-v0.1',
'NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO', 'NousResearch/Hermes-3-Llama-3.1-8B',
'mistralai/Mistral-7B-Instruct-v0.3', 'mistralai/Mistral-Nemo-Instruct-2407',
'microsoft/Phi-3-mini-4k-instruct', 'microsoft/Phi-3.5-mini-instruct',
] ]
model_aliases = { model_aliases = {
@@ -28,9 +28,9 @@ class HuggingChat(AbstractProvider, ProviderModelMixin):
"command-r-plus": "CohereForAI/c4ai-command-r-plus-08-2024", "command-r-plus": "CohereForAI/c4ai-command-r-plus-08-2024",
"qwen-2-72b": "Qwen/Qwen2.5-72B-Instruct", "qwen-2-72b": "Qwen/Qwen2.5-72B-Instruct",
"mixtral-8x7b": "mistralai/Mixtral-8x7B-Instruct-v0.1", "mixtral-8x7b": "mistralai/Mixtral-8x7B-Instruct-v0.1",
"mixtral-8x7b-dpo": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO", "hermes-3": "NousResearch/Hermes-3-Llama-3.1-8B",
"mistral-7b": "mistralai/Mistral-7B-Instruct-v0.3", "mistral-nemo": "mistralai/Mistral-Nemo-Instruct-2407",
"phi-3-mini-4k": "microsoft/Phi-3-mini-4k-instruct", "phi-3.5-mini": "microsoft/Phi-3.5-mini-instruct",
} }
@classmethod @classmethod

View file

@@ -249,27 +249,39 @@ mixtral_8x22b = Model(
best_provider = IterListProvider([DeepInfraChat, Airforce]) best_provider = IterListProvider([DeepInfraChat, Airforce])
) )
mistral_nemo = Model(
name = "mistral-nemo",
base_provider = "Mistral",
best_provider = IterListProvider([HuggingChat, HuggingFace])
)
### NousResearch ### ### NousResearch ###
mixtral_8x7b_dpo = Model( mixtral_8x7b_dpo = Model(
name = "mixtral-8x7b-dpo", name = "mixtral-8x7b-dpo",
base_provider = "NousResearch", base_provider = "NousResearch",
best_provider = IterListProvider([HuggingChat, Airforce, HuggingFace]) best_provider = IterListProvider([Airforce])
) )
### Microsoft ### hermes_3 = Model(
phi_3_mini_4k = Model( name = "hermes-3",
name = "phi-3-mini-4k", base_provider = "NousResearch",
base_provider = "Microsoft",
best_provider = IterListProvider([HuggingChat, HuggingFace]) best_provider = IterListProvider([HuggingChat, HuggingFace])
) )
### Microsoft ###
phi_3_medium_4k = Model( phi_3_medium_4k = Model(
name = "phi-3-medium-4k", name = "phi-3-medium-4k",
base_provider = "Microsoft", base_provider = "Microsoft",
best_provider = IterListProvider([DeepInfraChat]) best_provider = IterListProvider([DeepInfraChat])
) )
phi_3_5_mini = Model(
name = "phi-3.5-mini",
base_provider = "Microsoft",
best_provider = IterListProvider([HuggingChat, HuggingFace])
)
### Google DeepMind ### ### Google DeepMind ###
# gemini # gemini
@@ -800,18 +812,19 @@ class ModelUtils:
'mistral-7b': mistral_7b, 'mistral-7b': mistral_7b,
'mixtral-8x7b': mixtral_8x7b, 'mixtral-8x7b': mixtral_8x7b,
'mixtral-8x22b': mixtral_8x22b, 'mixtral-8x22b': mixtral_8x22b,
'mistral-nemo': mistral_nemo,
### NousResearch ### ### NousResearch ###
'mixtral-8x7b-dpo': mixtral_8x7b_dpo, 'mixtral-8x7b-dpo': mixtral_8x7b_dpo,
'hermes-3': hermes_3,
'yi-34b': yi_34b, 'yi-34b': yi_34b,
### Microsoft ### ### Microsoft ###
'phi-3-mini-4k': phi_3_mini_4k,
'phi_3_medium-4k': phi_3_medium_4k, 'phi_3_medium-4k': phi_3_medium_4k,
'phi-3.5-mini': phi_3_5_mini,
### Google ### ### Google ###
# gemini # gemini