From 5fd118f3c9d3d3a932695a3b413d8926d8ad58c0 Mon Sep 17 00:00:00 2001
From: PD <56485898+pratham-darooka@users.noreply.github.com>
Date: Fri, 19 Apr 2024 12:57:33 +0530
Subject: Added Meta llama-3 support! (#1856)

* Added Meta llama-3 support!
Renamed Llama2.py to Llama.py (and the provider class Llama2 to Llama) so that a single provider holds all the Llama family models (Llama 2 and Llama 3).

* Updated the HuggingChat provider: added meta-llama/Meta-Llama-3-70B-Instruct to its model list

* Update FlowGpt.py: add the missing newline at end of file
---
 g4f/Provider/FlowGpt.py     |  2 +-
 g4f/Provider/HuggingChat.py |  3 +-
 g4f/Provider/Llama.py       | 91 +++++++++++++++++++++++++++++++++++++++++++++
 g4f/Provider/Llama2.py      | 87 -------------------------------------------
 g4f/Provider/__init__.py    |  2 +-
 5 files changed, 95 insertions(+), 90 deletions(-)
 create mode 100644 g4f/Provider/Llama.py
 delete mode 100644 g4f/Provider/Llama2.py

(limited to 'g4f/Provider')

diff --git a/g4f/Provider/FlowGpt.py b/g4f/Provider/FlowGpt.py
index 7edd6f19..6c2aa046 100644
--- a/g4f/Provider/FlowGpt.py
+++ b/g4f/Provider/FlowGpt.py
@@ -99,4 +99,4 @@ class FlowGpt(AsyncGeneratorProvider, ProviderModelMixin):
                         if "event" not in message:
                             continue
                         if message["event"] == "text":
-                            yield message["data"]
\ No newline at end of file
+                            yield message["data"]
diff --git a/g4f/Provider/HuggingChat.py b/g4f/Provider/HuggingChat.py
index 882edb78..668ce4b1 100644
--- a/g4f/Provider/HuggingChat.py
+++ b/g4f/Provider/HuggingChat.py
@@ -19,7 +19,8 @@ class HuggingChat(AsyncGeneratorProvider, ProviderModelMixin):
         'mistralai/Mixtral-8x7B-Instruct-v0.1',
         'google/gemma-1.1-7b-it',
         'NousResearch/Nous-Hermes-2-Mixtral-8x7B-DPO',
-        'mistralai/Mistral-7B-Instruct-v0.2'
+        'mistralai/Mistral-7B-Instruct-v0.2',
+        'meta-llama/Meta-Llama-3-70B-Instruct'
     ]
     model_aliases = {
         "openchat/openchat_3.5": "openchat/openchat-3.5-0106",
diff --git a/g4f/Provider/Llama.py b/g4f/Provider/Llama.py
new file mode 100644
index 00000000..4d19866e
--- /dev/null
+++ b/g4f/Provider/Llama.py
@@ -0,0 +1,91 @@
+from __future__ import annotations
+
+from aiohttp import ClientSession
+
+from ..typing import AsyncResult, Messages
+from ..requests.raise_for_status import raise_for_status
+from .base_provider import AsyncGeneratorProvider, ProviderModelMixin
+
+
+class Llama(AsyncGeneratorProvider, ProviderModelMixin):
+    url = "https://www.llama2.ai"
+    working = True
+    supports_message_history = True
+    default_model = "meta/llama-3-70b-chat"
+    models = [
+        "meta/llama-2-7b-chat",
+        "meta/llama-2-13b-chat",
+        "meta/llama-2-70b-chat",
+        "meta/llama-3-8b-chat",
+        "meta/llama-3-70b-chat",
+    ]
+    model_aliases = {
+        "meta-llama/Meta-Llama-3-8b": "meta/llama-3-8b-chat",
+        "meta-llama/Meta-Llama-3-70b": "meta/llama-3-70b-chat",
+        "meta-llama/Llama-2-7b-chat-hf": "meta/llama-2-7b-chat",
+        "meta-llama/Llama-2-13b-chat-hf": "meta/llama-2-13b-chat",
+        "meta-llama/Llama-2-70b-chat-hf": "meta/llama-2-70b-chat",
+    }
+
+    @classmethod
+    async def create_async_generator(
+        cls,
+        model: str,
+        messages: Messages,
+        proxy: str = None,
+        system_message: str = "You are a helpful assistant.",
+        temperature: float = 0.75,
+        top_p: float = 0.9,
+        max_tokens: int = 8000,
+        **kwargs
+    ) -> AsyncResult:
+        headers = {
+            "User-Agent": "Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:109.0) Gecko/20100101 Firefox/118.0",
+            "Accept": "*/*",
+            "Accept-Language": "de,en-US;q=0.7,en;q=0.3",
+            "Accept-Encoding": "gzip, deflate, br",
+            "Referer": f"{cls.url}/",
+            "Content-Type": "text/plain;charset=UTF-8",
+            "Origin": cls.url,
+            "Connection": "keep-alive",
+            "Sec-Fetch-Dest": "empty",
+            "Sec-Fetch-Mode": "cors",
+            "Sec-Fetch-Site": "same-origin",
+            "Pragma": "no-cache",
+            "Cache-Control": "no-cache",
+            "TE": "trailers"
+        }
+        async with ClientSession(headers=headers) as session:
+            system_messages = [message["content"] for message in messages if message["role"] == "system"]
+            if system_messages:
+                system_message = "\n".join(system_messages)
+                messages = [message for message in messages if message["role"] != "system"] 
+            prompt = format_prompt(messages)
+            data = {
+                "prompt": prompt,
+                "model": cls.get_model(model),
+                "systemPrompt": system_message,
+                "temperature": temperature,
+                "topP": top_p,
+                "maxTokens": max_tokens,
+                "image": None
+            }
+            started = False
+            async with session.post(f"{cls.url}/api", json=data, proxy=proxy) as response:
+                await raise_for_status(response)
+                async for chunk in response.content.iter_any():
+                    if not chunk:
+                        continue
+                    if not started:
+                        chunk = chunk.lstrip()
+                        started = True
+                    yield chunk.decode(errors="ignore")
+            
+def format_prompt(messages: Messages):
+    messages = [
+        f"[INST] {message['content']} [/INST]"
+        if message["role"] == "user"
+        else message["content"]
+        for message in messages
+    ]
+    return "\n".join(messages) + "\n"
diff --git a/g4f/Provider/Llama2.py b/g4f/Provider/Llama2.py
deleted file mode 100644
index 04b5aee0..00000000
--- a/g4f/Provider/Llama2.py
+++ /dev/null
@@ -1,87 +0,0 @@
-from __future__ import annotations
-
-from aiohttp import ClientSession
-
-from ..typing import AsyncResult, Messages
-from ..requests.raise_for_status import raise_for_status
-from .base_provider import AsyncGeneratorProvider, ProviderModelMixin
-
-
-class Llama2(AsyncGeneratorProvider, ProviderModelMixin):
-    url = "https://www.llama2.ai"
-    working = True
-    supports_message_history = True
-    default_model = "meta/llama-2-70b-chat"
-    models = [
-        "meta/llama-2-7b-chat",
-        "meta/llama-2-13b-chat",
-        "meta/llama-2-70b-chat",
-    ]
-    model_aliases = {
-        "meta-llama/Llama-2-7b-chat-hf": "meta/llama-2-7b-chat",
-        "meta-llama/Llama-2-13b-chat-hf": "meta/llama-2-13b-chat",
-        "meta-llama/Llama-2-70b-chat-hf": "meta/llama-2-70b-chat",
-    }
-
-    @classmethod
-    async def create_async_generator(
-        cls,
-        model: str,
-        messages: Messages,
-        proxy: str = None,
-        system_message: str = "You are a helpful assistant.",
-        temperature: float = 0.75,
-        top_p: float = 0.9,
-        max_tokens: int = 8000,
-        **kwargs
-    ) -> AsyncResult:
-        headers = {
-            "User-Agent": "Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:109.0) Gecko/20100101 Firefox/118.0",
-            "Accept": "*/*",
-            "Accept-Language": "de,en-US;q=0.7,en;q=0.3",
-            "Accept-Encoding": "gzip, deflate, br",
-            "Referer": f"{cls.url}/",
-            "Content-Type": "text/plain;charset=UTF-8",
-            "Origin": cls.url,
-            "Connection": "keep-alive",
-            "Sec-Fetch-Dest": "empty",
-            "Sec-Fetch-Mode": "cors",
-            "Sec-Fetch-Site": "same-origin",
-            "Pragma": "no-cache",
-            "Cache-Control": "no-cache",
-            "TE": "trailers"
-        }
-        async with ClientSession(headers=headers) as session:
-            system_messages = [message["content"] for message in messages if message["role"] == "system"]
-            if system_messages:
-                system_message = "\n".join(system_messages)
-                messages = [message for message in messages if message["role"] != "system"] 
-            prompt = format_prompt(messages)
-            data = {
-                "prompt": prompt,
-                "model": cls.get_model(model),
-                "systemPrompt": system_message,
-                "temperature": temperature,
-                "topP": top_p,
-                "maxTokens": max_tokens,
-                "image": None
-            }
-            started = False
-            async with session.post(f"{cls.url}/api", json=data, proxy=proxy) as response:
-                await raise_for_status(response)
-                async for chunk in response.content.iter_any():
-                    if not chunk:
-                        continue
-                    if not started:
-                        chunk = chunk.lstrip()
-                        started = True
-                    yield chunk.decode(errors="ignore")
-            
-def format_prompt(messages: Messages):
-    messages = [
-        f"[INST] {message['content']} [/INST]"
-        if message["role"] == "user"
-        else message["content"]
-        for message in messages
-    ]
-    return "\n".join(messages) + "\n"
diff --git a/g4f/Provider/__init__.py b/g4f/Provider/__init__.py
index d5913e3c..f761df5b 100644
--- a/g4f/Provider/__init__.py
+++ b/g4f/Provider/__init__.py
@@ -40,7 +40,7 @@ from .HuggingChat      import HuggingChat
 from .HuggingFace      import HuggingFace
 from .Koala            import Koala
 from .Liaobots         import Liaobots
-from .Llama2           import Llama2
+from .Llama            import Llama
 from .Local            import Local
 from .PerplexityLabs   import PerplexityLabs
 from .Pi               import Pi
-- 
cgit v1.2.3