|
from __future__ import annotations |
|
|
|
import json |
|
import uuid |
|
|
|
from aiohttp import ClientSession |
|
|
|
from ..typing import AsyncGenerator |
|
from .base_provider import AsyncGeneratorProvider, format_prompt |
|
|
|
|
|
class H2o(AsyncGeneratorProvider):
    """Async streaming provider for the chat service hosted at ``url``.

    Class attributes:
        url: Base URL every request is sent to (also used as the Referer).
        working: Flag marking the provider as usable.
        model: Model name used when the caller does not supply one.
    """

    url = "https://gpt-gm.h2o.ai"
    working = True
    model = "h2oai/h2ogpt-gm-oasst1-en-2048-falcon-40b-v1"

    @classmethod
    async def create_async_generator(
        cls,
        model: str,
        messages: list[dict[str, str]],
        proxy: str | None = None,
        **kwargs
    ) -> AsyncGenerator:
        """Stream the generated text for ``messages`` token by token.

        The request sequence is: POST ``/settings``, POST ``/conversation``
        (to obtain a ``conversationId``), POST the prompt to
        ``/conversation/<id>`` and read the streamed ``data:`` lines, then
        DELETE ``/conversation/<id>``.

        Args:
            model: Model name; a falsy value falls back to ``cls.model``.
            messages: Chat history, rendered to a prompt by ``format_prompt``.
            proxy: Optional proxy URL forwarded to every aiohttp request.
            **kwargs: Extra entries merged into the request's ``parameters``
                mapping, overriding the defaults listed below.

        Yields:
            The ``text`` of every streamed token whose ``special`` flag is
            falsy.

        Raises:
            aiohttp.ClientResponseError: If any request returns an HTTP
                error status.
        """
        model = model if model else cls.model
        headers = {"Referer": cls.url + "/"}

        async with ClientSession(headers=headers) as session:
            settings = {
                "ethicsModalAccepted": "true",
                "shareConversationsWithModelAuthors": "true",
                "ethicsModalAcceptedAt": "",
                "activeModel": model,
                "searchEnabled": "true",
            }
            async with session.post(
                f"{cls.url}/settings",
                proxy=proxy,
                data=settings,
            ) as response:
                response.raise_for_status()

            async with session.post(
                f"{cls.url}/conversation",
                proxy=proxy,
                json={"model": model},
            ) as response:
                response.raise_for_status()
                conversation_id = (await response.json())["conversationId"]

            data = {
                "inputs": format_prompt(messages),
                "parameters": {
                    "temperature": 0.4,
                    "truncate": 2048,
                    "max_new_tokens": 1024,
                    "do_sample": True,
                    "repetition_penalty": 1.2,
                    "return_full_text": False,
                    # Caller-supplied values override the defaults above.
                    **kwargs
                },
                "stream": True,
                "options": {
                    "id": str(uuid.uuid4()),
                    "response_id": str(uuid.uuid4()),
                    "is_retry": False,
                    "use_cache": False,
                    "web_search_id": "",
                },
            }
            conversation_url = f"{cls.url}/conversation/{conversation_id}"
            prefix = "data:"

            # try/finally so the conversation is deleted even when streaming
            # fails or the consumer stops iterating early.
            try:
                async with session.post(
                    conversation_url,
                    proxy=proxy,
                    json=data,
                ) as response:
                    # Surface HTTP errors instead of silently yielding nothing.
                    response.raise_for_status()
                    async for raw_line in response.content:
                        line = raw_line.decode("utf-8")
                        if not line.startswith(prefix):
                            continue
                        # strip() rather than dropping the last character:
                        # the final line may arrive without a newline.
                        payload = line[len(prefix):].strip()
                        if not payload:
                            continue
                        event = json.loads(payload)
                        if not event["token"]["special"]:
                            yield event["token"]["text"]
            finally:
                # NOTE(review): the request body is resent on DELETE exactly as
                # before; presumably the server ignores it -- confirm before
                # removing.
                async with session.delete(
                    conversation_url,
                    proxy=proxy,
                    json=data,
                ) as response:
                    response.raise_for_status()

    # NOTE: stacking @classmethod on @property was deprecated in Python 3.11
    # and removed in 3.13; it is kept here to preserve the existing interface.
    @classmethod
    @property
    def params(cls):
        """Return a one-line summary of the parameters this provider supports."""
        params = [
            ("model", "str"),
            ("messages", "list[dict[str, str]]"),
            ("stream", "bool"),
            ("temperature", "float"),
            ("truncate", "int"),
            ("max_new_tokens", "int"),
            ("do_sample", "bool"),
            ("repetition_penalty", "float"),
            ("return_full_text", "bool"),
        ]
        param = ", ".join([": ".join(p) for p in params])
        return f"g4f.provider.{cls.__name__} supports: ({param})"
|
|