summary | refs | log | tree | commit | diff | stats
path: root/g4f/Provider/Llama.py
diff options
context:
space:
mode:
Diffstat (limited to 'g4f/Provider/Llama.py')
-rw-r--r-- g4f/Provider/Llama.py 91
1 files changed, 91 insertions, 0 deletions
diff --git a/g4f/Provider/Llama.py b/g4f/Provider/Llama.py
new file mode 100644
index 00000000..4d19866e
--- /dev/null
+++ b/g4f/Provider/Llama.py
@@ -0,0 +1,91 @@
+from __future__ import annotations
+
+from aiohttp import ClientSession
+
+from ..typing import AsyncResult, Messages
+from ..requests.raise_for_status import raise_for_status
+from .base_provider import AsyncGeneratorProvider, ProviderModelMixin
+
+
class Llama(AsyncGeneratorProvider, ProviderModelMixin):
    """Provider that streams chat completions from the llama2.ai ``/api`` endpoint."""

    url = "https://www.llama2.ai"
    working = True
    supports_message_history = True
    default_model = "meta/llama-3-70b-chat"
    # Model identifiers sent verbatim in the request payload.
    models = [
        "meta/llama-2-7b-chat",
        "meta/llama-2-13b-chat",
        "meta/llama-2-70b-chat",
        "meta/llama-3-8b-chat",
        "meta/llama-3-70b-chat",
    ]
    # Alternative (Hugging Face style) names mapped onto the identifiers above.
    model_aliases = {
        "meta-llama/Meta-Llama-3-8b": "meta/llama-3-8b-chat",
        "meta-llama/Meta-Llama-3-70b": "meta/llama-3-70b-chat",
        "meta-llama/Llama-2-7b-chat-hf": "meta/llama-2-7b-chat",
        "meta-llama/Llama-2-13b-chat-hf": "meta/llama-2-13b-chat",
        "meta-llama/Llama-2-70b-chat-hf": "meta/llama-2-70b-chat",
    }

    @classmethod
    async def create_async_generator(
        cls,
        model: str,
        messages: Messages,
        proxy: str = None,
        system_message: str = "You are a helpful assistant.",
        temperature: float = 0.75,
        top_p: float = 0.9,
        max_tokens: int = 8000,
        **kwargs
    ) -> AsyncResult:
        """Stream the model's reply to ``messages`` as decoded text pieces.

        Args:
            model: Requested model name; passed through ``cls.get_model``
                before being sent (presumably alias/default resolution from
                ``ProviderModelMixin`` -- confirm against the mixin).
            messages: Conversation as dicts with ``"role"`` and ``"content"``.
                Messages with role ``"system"`` are removed from the prompt
                and, if any exist, joined with newlines to replace
                ``system_message``.
            proxy: Optional proxy URL handed to the HTTP request.
            system_message: System prompt used when ``messages`` contains no
                system entries.
            temperature: Sent as ``temperature`` in the payload.
            top_p: Sent as ``topP`` in the payload.
            max_tokens: Sent as ``maxTokens`` in the payload.
            **kwargs: Accepted for interface compatibility; not used here.

        Yields:
            Non-empty ``str`` fragments of the response body, with leading
            whitespace of the overall response removed.

        Raises:
            Whatever ``raise_for_status`` raises for an unsuccessful response.
        """
        # Function-scope import keeps this block self-contained.
        import codecs

        headers = {
            "User-Agent": "Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:109.0) Gecko/20100101 Firefox/118.0",
            "Accept": "*/*",
            "Accept-Language": "de,en-US;q=0.7,en;q=0.3",
            "Accept-Encoding": "gzip, deflate, br",
            "Referer": f"{cls.url}/",
            "Content-Type": "text/plain;charset=UTF-8",
            "Origin": cls.url,
            "Connection": "keep-alive",
            "Sec-Fetch-Dest": "empty",
            "Sec-Fetch-Mode": "cors",
            "Sec-Fetch-Site": "same-origin",
            "Pragma": "no-cache",
            "Cache-Control": "no-cache",
            "TE": "trailers"
        }
        async with ClientSession(headers=headers) as session:
            # System messages travel in their own payload field, not in the prompt.
            system_messages = [message["content"] for message in messages if message["role"] == "system"]
            if system_messages:
                system_message = "\n".join(system_messages)
            messages = [message for message in messages if message["role"] != "system"]
            prompt = format_prompt(messages)
            data = {
                "prompt": prompt,
                "model": cls.get_model(model),
                "systemPrompt": system_message,
                "temperature": temperature,
                "topP": top_p,
                "maxTokens": max_tokens,
                "image": None
            }
            # A stateful decoder buffers a multi-byte UTF-8 character that is
            # split across two network chunks; decoding each chunk on its own
            # with errors="ignore" would silently drop such characters.
            decoder = codecs.getincrementaldecoder("utf-8")(errors="ignore")
            started = False
            async with session.post(f"{cls.url}/api", json=data, proxy=proxy) as response:
                await raise_for_status(response)
                async for chunk in response.content.iter_any():
                    if not chunk:
                        continue
                    if not started:
                        # Keep stripping until real content arrives, so leading
                        # whitespace spread over several chunks is fully removed.
                        chunk = chunk.lstrip()
                        if not chunk:
                            continue
                        started = True
                    text = decoder.decode(chunk)
                    if text:
                        yield text
+
def format_prompt(messages: Messages):
    """Render a conversation as one newline-separated prompt string.

    Messages whose role is ``"user"`` are wrapped as ``[INST] ... [/INST]``;
    the content of every other message is used unchanged. Entries are joined
    with newlines and the result always ends with a trailing newline.
    """
    rendered = []
    for entry in messages:
        if entry["role"] == "user":
            rendered.append(f"[INST] {entry['content']} [/INST]")
        else:
            rendered.append(entry["content"])
    return "\n".join(rendered) + "\n"