summary | refs | log | tree | commit | diff | stats
diff options
context:
space:
mode:
-rw-r--r-- g4f/Provider/HuggingChat.py | 12
-rw-r--r-- g4f/models.py | 29
2 files changed, 27 insertions, 14 deletions
diff --git a/g4f/Provider/HuggingChat.py b/g4f/Provider/HuggingChat.py
index 01490e2f..488a1114 100644
--- a/g4f/Provider/HuggingChat.py
+++ b/g4f/Provider/HuggingChat.py
@@ -18,9 +18,9 @@ class HuggingChat(AbstractProvider, ProviderModelMixin):
'CohereForAI/c4ai-command-r-plus-08-2024',
'Qwen/Qwen2.5-72B-Instruct',
'mistralai/Mixtral-8x7B-Instruct-v0.1',
- 'NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO',
- 'mistralai/Mistral-7B-Instruct-v0.3',
- 'microsoft/Phi-3-mini-4k-instruct',
+ 'NousResearch/Hermes-3-Llama-3.1-8B',
+ 'mistralai/Mistral-Nemo-Instruct-2407',
+ 'microsoft/Phi-3.5-mini-instruct',
]
model_aliases = {
@@ -28,9 +28,9 @@ class HuggingChat(AbstractProvider, ProviderModelMixin):
"command-r-plus": "CohereForAI/c4ai-command-r-plus-08-2024",
"qwen-2-72b": "Qwen/Qwen2.5-72B-Instruct",
"mixtral-8x7b": "mistralai/Mixtral-8x7B-Instruct-v0.1",
- "mixtral-8x7b-dpo": "NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO",
- "mistral-7b": "mistralai/Mistral-7B-Instruct-v0.3",
- "phi-3-mini-4k": "microsoft/Phi-3-mini-4k-instruct",
+ "hermes-3": "NousResearch/Hermes-3-Llama-3.1-8B",
+ "mistral-nemo": "mistralai/Mistral-Nemo-Instruct-2407",
+ "phi-3.5-mini": "microsoft/Phi-3.5-mini-instruct",
}
@classmethod
diff --git a/g4f/models.py b/g4f/models.py
index 2f4405a3..a6ff9e13 100644
--- a/g4f/models.py
+++ b/g4f/models.py
@@ -249,27 +249,39 @@ mixtral_8x22b = Model(
best_provider = IterListProvider([DeepInfraChat, Airforce])
)
+mistral_nemo = Model(
+ name = "mistral-nemo",
+ base_provider = "Mistral",
+ best_provider = IterListProvider([HuggingChat, HuggingFace])
+)
+
### NousResearch ###
mixtral_8x7b_dpo = Model(
name = "mixtral-8x7b-dpo",
base_provider = "NousResearch",
- best_provider = IterListProvider([HuggingChat, Airforce, HuggingFace])
+ best_provider = IterListProvider([Airforce])
)
-### Microsoft ###
-phi_3_mini_4k = Model(
- name = "phi-3-mini-4k",
- base_provider = "Microsoft",
+hermes_3 = Model(
+ name = "hermes-3",
+ base_provider = "NousResearch",
best_provider = IterListProvider([HuggingChat, HuggingFace])
)
+
+### Microsoft ###
phi_3_medium_4k = Model(
name = "phi-3-medium-4k",
base_provider = "Microsoft",
best_provider = IterListProvider([DeepInfraChat])
)
+phi_3_5_mini = Model(
+ name = "phi-3.5-mini",
+ base_provider = "Microsoft",
+ best_provider = IterListProvider([HuggingChat, HuggingFace])
+)
### Google DeepMind ###
# gemini
@@ -800,18 +812,19 @@ class ModelUtils:
'mistral-7b': mistral_7b,
'mixtral-8x7b': mixtral_8x7b,
'mixtral-8x22b': mixtral_8x22b,
+'mistral-nemo': mistral_nemo,
### NousResearch ###
-'mixtral-8x7b-dpo': mixtral_8x7b_dpo,
+'mixtral-8x7b-dpo': mixtral_8x7b_dpo,
+'hermes-3': hermes_3,
'yi-34b': yi_34b,
### Microsoft ###
-'phi-3-mini-4k': phi_3_mini_4k,
'phi_3_medium-4k': phi_3_medium_4k,
-
+'phi-3.5-mini': phi_3_5_mini,
### Google ###
# gemini