From 1e62a9dd60d69de636845497ffe9512fe60dfa2a Mon Sep 17 00:00:00 2001 From: kqlio67 Date: Wed, 25 Sep 2024 20:05:39 +0300 Subject: feat(g4f/Provider/HuggingChat.py): update model list and aliases --- g4f/Provider/HuggingChat.py | 12 ++++++------ g4f/models.py | 29 +++++++++++++++++++++-------- 2 files changed, 27 insertions(+), 14 deletions(-) (limited to 'g4f') diff --git a/g4f/Provider/HuggingChat.py b/g4f/Provider/HuggingChat.py index 01490e2f..488a1114 100644 --- a/g4f/Provider/HuggingChat.py +++ b/g4f/Provider/HuggingChat.py @@ -18,9 +18,9 @@ class HuggingChat(AbstractProvider, ProviderModelMixin): 'CohereForAI/c4ai-command-r-plus-08-2024', 'Qwen/Qwen2.5-72B-Instruct', 'mistralai/Mixtral-8x7B-Instruct-v0.1', - 'NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO', - 'mistralai/Mistral-7B-Instruct-v0.3', - 'microsoft/Phi-3-mini-4k-instruct', + 'NousResearch/Hermes-3-Llama-3.1-8B', + 'mistralai/Mistral-Nemo-Instruct-2407', + 'microsoft/Phi-3.5-mini-instruct', ] model_aliases = { @@ -28,9 +28,9 @@ class HuggingChat(AbstractProvider, ProviderModelMixin): "command-r-plus": "CohereForAI/c4ai-command-r-plus-08-2024", "qwen-2-72b": "Qwen/Qwen2.5-72B-Instruct", "mixtral-8x7b": "mistralai/Mixtral-8x7B-Instruct-v0.1", - "mixtral-8x7b-dpo": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO", - "mistral-7b": "mistralai/Mistral-7B-Instruct-v0.3", - "phi-3-mini-4k": "microsoft/Phi-3-mini-4k-instruct", + "hermes-3": "NousResearch/Hermes-3-Llama-3.1-8B", + "mistral-nemo": "mistralai/Mistral-Nemo-Instruct-2407", + "phi-3.5-mini": "microsoft/Phi-3.5-mini-instruct", } @classmethod diff --git a/g4f/models.py b/g4f/models.py index 2f4405a3..a6ff9e13 100644 --- a/g4f/models.py +++ b/g4f/models.py @@ -249,27 +249,39 @@ mixtral_8x22b = Model( best_provider = IterListProvider([DeepInfraChat, Airforce]) ) +mistral_nemo = Model( + name = "mistral-nemo", + base_provider = "Mistral", + best_provider = IterListProvider([HuggingChat, HuggingFace]) +) + ### NousResearch ### mixtral_8x7b_dpo = Model( name = "mixtral-8x7b-dpo", base_provider = "NousResearch", - best_provider = IterListProvider([HuggingChat, Airforce, HuggingFace]) + best_provider = IterListProvider([Airforce]) ) -### Microsoft ### -phi_3_mini_4k = Model( - name = "phi-3-mini-4k", - base_provider = "Microsoft", +hermes_3 = Model( + name = "hermes-3", + base_provider = "NousResearch", best_provider = IterListProvider([HuggingChat, HuggingFace]) ) + +### Microsoft ### phi_3_medium_4k = Model( name = "phi-3-medium-4k", base_provider = "Microsoft", best_provider = IterListProvider([DeepInfraChat]) ) +phi_3_5_mini = Model( + name = "phi-3.5-mini", + base_provider = "Microsoft", + best_provider = IterListProvider([HuggingChat, HuggingFace]) +) ### Google DeepMind ### # gemini @@ -800,18 +812,19 @@ class ModelUtils: 'mistral-7b': mistral_7b, 'mixtral-8x7b': mixtral_8x7b, 'mixtral-8x22b': mixtral_8x22b, +'mistral-nemo': mistral_nemo, ### NousResearch ### -'mixtral-8x7b-dpo': mixtral_8x7b_dpo, +'mixtral-8x7b-dpo': mixtral_8x7b_dpo, +'hermes-3': hermes_3, 'yi-34b': yi_34b, ### Microsoft ### -'phi-3-mini-4k': phi_3_mini_4k, 'phi_3_medium-4k': phi_3_medium_4k, - +'phi-3.5-mini': phi_3_5_mini, ### Google ### # gemini -- cgit v1.2.3