|
from __future__ import annotations |
|
|
|
import json |
|
|
|
from aiohttp import ClientSession |
|
|
|
from ..typing import AsyncGenerator |
|
from .base_provider import AsyncGeneratorProvider, format_prompt, get_cookies |
|
|
|
|
|
class HuggingChat(AsyncGeneratorProvider):
    """Provider that sends a prompt to the HuggingChat web endpoint at ``url``.

    Each request creates a conversation, posts the formatted prompt to it and
    deletes the conversation again once the reply has been consumed.
    """

    url = "https://huggingface.co/chat"
    needs_auth = True
    working = True
    # Model name used when the caller passes an empty/falsy ``model``.
    model = "OpenAssistant/oasst-sft-6-llama-30b-xor"

    @classmethod
    async def create_async_generator(
        cls,
        model: str,
        messages: list[dict[str, str]],
        stream: bool = True,
        proxy: str = None,
        cookies: dict = None,
        **kwargs
    ) -> AsyncGenerator:
        """Yield the reply text for ``messages``.

        Args:
            model: Model name sent when creating the conversation; falls back
                to ``cls.model`` when falsy.
            messages: Chat messages, passed through ``format_prompt``.
            stream: When true, yield the text of each non-special token as it
                arrives; otherwise yield the stripped ``generated_text`` once.
            proxy: Optional proxy; ``http://`` is prepended when no scheme is
                given.
            cookies: Session cookies; when empty they are obtained from
                ``get_cookies(".huggingface.co")``.
            **kwargs: Merged into the ``parameters`` object of the request,
                overriding the defaults listed below.

        Raises:
            RuntimeError: If the response carries an ``error`` entry or does
                not have the expected shape.
        """
        model = model or cls.model
        if proxy and "://" not in proxy:
            proxy = f"http://{proxy}"
        if not cookies:
            cookies = get_cookies(".huggingface.co")

        headers = {
            'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/111.0.0.0 Safari/537.36',
        }
        async with ClientSession(
            cookies=cookies,
            headers=headers
        ) as session:
            async with session.post(f"{cls.url}/conversation", proxy=proxy, json={"model": model}) as response:
                conversation_id = (await response.json())["conversationId"]

            conversation_url = f"{cls.url}/conversation/{conversation_id}"
            send = {
                "inputs": format_prompt(messages),
                "parameters": {
                    "temperature": 0.2,
                    "truncate": 1000,
                    "max_new_tokens": 1024,
                    "stop": ["</s>"],
                    "top_p": 0.95,
                    "repetition_penalty": 1.2,
                    "top_k": 50,
                    "return_full_text": False,
                    **kwargs
                },
                "stream": stream,
                # NOTE(review): both ids are fixed constants reused for every
                # request — confirm the endpoint does not require unique ones.
                "options": {
                    "id": "9e9b8bc4-6604-40c6-994e-8eb78fa32e37",
                    "response_id": "04ce2602-3bea-45e8-8efc-cef00680376a",
                    "is_retry": False,
                    "use_cache": False,
                    "web_search_id": ""
                }
            }

            # The conversation must be deleted even when reading the reply
            # fails or the consumer closes this generator early.
            succeeded = False
            try:
                async with session.post(conversation_url, proxy=proxy, json=send) as response:
                    if not stream:
                        data = await response.json()
                        if "error" in data:
                            raise RuntimeError(data["error"])
                        elif isinstance(data, list) and data:
                            yield data[0]["generated_text"].strip()
                        else:
                            # Also covers an empty list, which has no first
                            # entry to read the text from.
                            raise RuntimeError(f"Response: {data}")
                    else:
                        start = "data:"
                        first = True
                        async for line in response.content:
                            line = line.decode("utf-8")
                            if not line.startswith(start):
                                continue
                            # json.loads ignores surrounding whitespace, so the
                            # line terminator needs no manual trimming; slicing
                            # off the last character would corrupt a final
                            # line that arrives without a newline.
                            line = json.loads(line[len(start):])
                            if "token" not in line:
                                raise RuntimeError(f"Response: {line}")
                            if line["token"]["special"]:
                                continue
                            if first:
                                # Drop leading whitespace of the reply.
                                yield line["token"]["text"].lstrip()
                                first = False
                            else:
                                yield line["token"]["text"]
                succeeded = True
            finally:
                async with session.delete(conversation_url, proxy=proxy) as response:
                    # Report a failed delete status only when the request
                    # itself went through, so cleanup never hides the
                    # exception that is already propagating.
                    if succeeded:
                        response.raise_for_status()

    # NOTE(review): stacking ``classmethod`` on ``property`` was deprecated in
    # Python 3.11 and removed in 3.13 — confirm the supported interpreter range.
    @classmethod
    @property
    def params(cls):
        """Return a one-line summary of the parameters this provider lists."""
        # NOTE(review): ``cookies`` is accepted by create_async_generator but
        # is not listed here — confirm whether that is intentional.
        params = [
            ("model", "str"),
            ("messages", "list[dict[str, str]]"),
            ("stream", "bool"),
            ("proxy", "str"),
        ]
        param = ", ".join([": ".join(p) for p in params])
        return f"g4f.provider.{cls.__name__} supports: ({param})"
|
|