Spaces:

Docfile
/

Gza

Runtime error

Gza / g4f /Provider /HuggingChat.py

58e1001 over 2 years ago

3.93 kB

	from __future__ import annotations

	import json

	from aiohttp import ClientSession

	from ..typing import AsyncGenerator
	from .base_provider import AsyncGeneratorProvider, format_prompt, get_cookies


	class HuggingChat(AsyncGeneratorProvider):
	    """Provider that generates text through the HuggingChat web endpoints.

	    Each call creates a conversation under ``url``, posts the prompt to it,
	    yields the generated text and finally deletes the conversation again.
	    """

	    url = "https://huggingface.co/chat"
	    # Flags consumed by the provider framework; their exact semantics are
	    # defined by the base class, which is outside this file.
	    needs_auth = True
	    working = True
	    # Model used when the caller passes a falsy ``model``.
	    model = "OpenAssistant/oasst-sft-6-llama-30b-xor"

	    @classmethod
	    async def create_async_generator(
	        cls,
	        model: str,
	        messages: list[dict[str, str]],
	        stream: bool = True,
	        proxy: str = None,
	        cookies: dict = None,
	        **kwargs
	    ) -> AsyncGenerator:
	        """Open a conversation, send the prompt and yield the generated text.

	        Args:
	            model: Model name sent when creating the conversation; falls
	                back to ``cls.model`` when falsy.
	            messages: Chat messages, turned into a single prompt by
	                ``format_prompt``.
	            stream: When true, yield the text of each non-special token as
	                it arrives; otherwise yield the stripped ``generated_text``
	                of the first result once.
	            proxy: Optional proxy address; ``http://`` is prepended when it
	                contains no scheme.
	            cookies: Cookies for the HTTP session; when falsy they are
	                obtained from ``get_cookies(".huggingface.co")``.
	            **kwargs: Merged into the request's ``parameters`` dict and
	                override the defaults defined there.

	        Yields:
	            Pieces of generated text (``str``).

	        Raises:
	            RuntimeError: The response carries an ``"error"`` entry, has an
	                unexpected shape, or a streamed event lacks ``"token"``.
	            aiohttp.ClientResponseError: Creating or deleting the
	                conversation returned an HTTP error status.
	        """
	        model = model if model else cls.model
	        if proxy and "://" not in proxy:
	            proxy = f"http://{proxy}"
	        if not cookies:
	            cookies = get_cookies(".huggingface.co")

	        headers = {
	            'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/111.0.0.0 Safari/537.36',
	        }
	        async with ClientSession(
	            cookies=cookies,
	            headers=headers
	        ) as session:
	            async with session.post(f"{cls.url}/conversation", proxy=proxy, json={"model": model}) as response:
	                # Fail with a clear HTTP error instead of a confusing
	                # KeyError / content-type error on the lookup below.
	                response.raise_for_status()
	                conversation_id = (await response.json())["conversationId"]

	            send = {
	                "inputs": format_prompt(messages),
	                "parameters": {
	                    "temperature": 0.2,
	                    "truncate": 1000,
	                    "max_new_tokens": 1024,
	                    "stop": ["</s>"],
	                    "top_p": 0.95,
	                    "repetition_penalty": 1.2,
	                    "top_k": 50,
	                    "return_full_text": False,
	                    # Caller-supplied values come last so they win over the defaults.
	                    **kwargs
	                },
	                "stream": stream,
	                "options": {
	                    "id": "9e9b8bc4-6604-40c6-994e-8eb78fa32e37",
	                    "response_id": "04ce2602-3bea-45e8-8efc-cef00680376a",
	                    "is_retry": False,
	                    "use_cache": False,
	                    "web_search_id": ""
	                }
	            }
	            try:
	                async with session.post(f"{cls.url}/conversation/{conversation_id}", proxy=proxy, json=send) as response:
	                    if not stream:
	                        data = await response.json()
	                        if "error" in data:
	                            raise RuntimeError(data["error"])
	                        elif isinstance(data, list):
	                            yield data[0]["generated_text"].strip()
	                        else:
	                            raise RuntimeError(f"Response: {data}")
	                    else:
	                        start = "data:"
	                        first = True
	                        async for raw_line in response.content:
	                            text = raw_line.decode("utf-8")
	                            if not text.startswith(start):
	                                continue
	                            # json.loads ignores surrounding whitespace, so the
	                            # line ending needs no manual slicing; this also
	                            # keeps a final line without a newline intact.
	                            event = json.loads(text[len(start):])
	                            if "token" not in event:
	                                raise RuntimeError(f"Response: {event}")
	                            token = event["token"]
	                            if token["special"]:
	                                continue
	                            if first:
	                                # Only the first emitted piece is left-stripped.
	                                yield token["text"].lstrip()
	                                first = False
	                            else:
	                                yield token["text"]
	            finally:
	                # Always remove the conversation, including when the request
	                # above failed or the consumer stopped iterating early.
	                async with session.delete(f"{cls.url}/conversation/{conversation_id}", proxy=proxy) as response:
	                    response.raise_for_status()

	    # NOTE(review): stacking @classmethod on @property was deprecated in
	    # Python 3.11 and removed in 3.13; kept unchanged here because a
	    # replacement has to be coordinated with the base class.
	    @classmethod
	    @property
	    def params(cls):
	        """Return a one-line description of the supported call parameters."""
	        params = [
	            ("model", "str"),
	            ("messages", "list[dict[str, str]]"),
	            ("stream", "bool"),
	            ("proxy", "str"),
	        ]
	        param = ", ".join([": ".join(p) for p in params])
	        return f"g4f.provider.{cls.__name__} supports: ({param})"