summary | refs | log | tree | commit | diff | stats
path: root/g4f/Provider/nexra/NexraLLaMA31.py
diff options
context:
space:
mode:
Diffstat (limited to '')
-rw-r--r-- g4f/Provider/nexra/NexraLLaMA31.py | 83
1 file changed, 83 insertions, 0 deletions
diff --git a/g4f/Provider/nexra/NexraLLaMA31.py b/g4f/Provider/nexra/NexraLLaMA31.py
new file mode 100644
index 00000000..c67febb3
--- /dev/null
+++ b/g4f/Provider/nexra/NexraLLaMA31.py
@@ -0,0 +1,83 @@
+from __future__ import annotations
+
+from aiohttp import ClientSession
+import json
+
+from ...typing import AsyncResult, Messages
+from ..base_provider import AsyncGeneratorProvider, ProviderModelMixin
+from ..helper import format_prompt
+
+
+class NexraLLaMA31(AsyncGeneratorProvider, ProviderModelMixin):
+    """Provider for the Nexra LLaMA 3.1 chat endpoint; yields one reply string."""
+
+    label = "Nexra LLaMA 3.1"
+    url = "https://nexra.aryahcr.cc/documentation/llama-3.1/en"
+    api_endpoint = "https://nexra.aryahcr.cc/api/chat/complements"
+    working = True
+    supports_stream = True
+
+    default_model = 'llama-3.1'
+    models = [default_model]
+
+    @classmethod
+    def get_model(cls, model: str) -> str:
+        """Return the single supported model, ignoring the requested name."""
+        return cls.default_model
+
+    @classmethod
+    async def create_async_generator(
+        cls,
+        model: str,
+        messages: Messages,
+        proxy: str = None,
+        stream: bool = False,
+        markdown: bool = False,
+        **kwargs
+    ) -> AsyncResult:
+        """POST the formatted conversation and yield the reply text once.
+
+        ``model`` is replaced by ``default_model``; ``stream`` and ``markdown``
+        are sent in the payload and ``proxy`` is passed to ``session.post``.
+        When streaming, the latest non-empty ``message`` is yielded after a
+        record with a truthy ``finish`` (or at end of body); otherwise the JSON
+        body's ``message`` is yielded. An HTTP error status raises.
+        """
+        data = {
+            "messages": [{"role": "user", "content": format_prompt(messages)}],
+            "stream": stream,
+            "markdown": markdown,
+            "model": cls.get_model(model)
+        }
+        async with ClientSession(headers={"Content-Type": "application/json"}) as session:
+            async with session.post(cls.api_endpoint, json=data, proxy=proxy) as response:
+                response.raise_for_status()
+                if not stream:
+                    response_data = await response.json(content_type=None)
+                    if 'message' in response_data and response_data['message']:
+                        yield response_data['message']
+                    return
+                collected_message = ""
+                pending = b""  # bytes of a record that is not complete yet
+                async for chunk in response.content.iter_any():
+                    # Chunks can end mid-record or mid-character, so buffer raw bytes.
+                    *records, pending = (pending + chunk).split(b"\x1e")
+                    try:
+                        json.loads(pending)  # tail may already be a whole record
+                    except ValueError:  # incomplete JSON or partial UTF-8: keep waiting
+                        pass
+                    else:
+                        records.append(pending)
+                        pending = b""
+                    for record in records:
+                        if not record.strip():
+                            continue
+                        message_data = json.loads(record)
+                        if message_data.get('message'):
+                            collected_message = message_data['message']
+                        if message_data.get('finish', False):
+                            yield collected_message
+                            return
+                # Body ended without a 'finish' record: return what was received.
+                if collected_message:
+                    yield collected_message