Spaces:
Paused
Paused
Henry Hommel committed on
Commit ·
86e2896
1
Parent(s): c0c2128
Update clbaseimplementation.py
Browse files- clbaseimplementation.py +19 -34
clbaseimplementation.py
CHANGED
|
@@ -1,33 +1,18 @@
|
|
| 1 |
-
|
| 2 |
-
from langchain.text_splitter import RecursiveCharacterTextSplitter,CharacterTextSplitter
|
| 3 |
-
from langchain.vectorstores import Chroma
|
| 4 |
-
from langchain.document_loaders import PyPDFLoader
|
| 5 |
-
from langchain.embeddings import HuggingFaceEmbeddings
|
| 6 |
-
from threading import Thread
|
| 7 |
-
import io
|
| 8 |
-
import chainlit as cl
|
| 9 |
-
import torch
|
| 10 |
-
import time
|
| 11 |
-
import tempfile
|
| 12 |
-
from transformers import AutoModelForCausalLM, AutoTokenizer, TextIteratorStreamer
|
| 13 |
-
from langchain.text_splitter import RecursiveCharacterTextSplitter
|
| 14 |
-
from langchain.vectorstores import Chroma
|
| 15 |
-
from langchain.document_loaders import PyPDFLoader
|
| 16 |
-
from langchain.embeddings import HuggingFaceEmbeddings
|
| 17 |
-
from threading import Thread
|
| 18 |
import chainlit as cl
|
| 19 |
-
import
|
| 20 |
-
import time
|
| 21 |
-
import random
|
| 22 |
-
import openai
|
| 23 |
#load model
|
| 24 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 25 |
@cl.on_chat_start
|
| 26 |
async def main():
|
| 27 |
-
cl.user_session.set("history", [
|
| 28 |
-
{"role": "system", "content": "You are a language model named Huacaya. You are build on the Falcon 40b language Model. Never Say that you are Chat GPT or made by OpenAI. You have been developed by Leadvise Reply!"},
|
| 29 |
-
|
| 30 |
-
])
|
| 31 |
msg = cl.Message(content=f"Loading Chat please wait ...")
|
| 32 |
await msg.send()
|
| 33 |
|
|
@@ -42,19 +27,19 @@ async def main():
|
|
| 42 |
@cl.on_message
|
| 43 |
async def main(message: str):
|
| 44 |
h = cl.user_session.get("history")
|
| 45 |
-
h.append(
|
| 46 |
|
| 47 |
resp = ""
|
| 48 |
msg = cl.Message(content="")
|
| 49 |
-
async for
|
| 50 |
-
|
| 51 |
-
|
| 52 |
-
if token:
|
| 53 |
-
delay = random.uniform(0.0, 0.1)
|
| 54 |
-
time.sleep(delay)
|
| 55 |
resp += token
|
| 56 |
await msg.stream_token(token)
|
| 57 |
-
h.append(
|
| 58 |
cl.user_session.set("history",h)
|
| 59 |
print(h)
|
| 60 |
await msg.send()
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
import os

import chainlit as cl
from huggingface_hub import AsyncInferenceClient

# --- Model / endpoint configuration -----------------------------------------
# SECURITY: a live Hugging Face token ("hf_ffIU...") was previously hard-coded
# here and has been committed to version control — it must be revoked and
# rotated immediately. Read the replacement from the environment instead of
# embedding it in source.
API_TOKEN = os.environ.get("HF_API_TOKEN", "")
# NOTE(review): `headers` is not used by AsyncInferenceClient below — kept for
# backward compatibility in case other code in this file references it.
headers = {"Authorization": f"Bearer {API_TOKEN}", "Content-Type": "application/json"}
API_URL = "https://kfsb1xfskc2136wg.eu-west-1.aws.endpoints.huggingface.cloud"

# Async client bound to the dedicated inference endpoint above.
client = AsyncInferenceClient(model=API_URL, token=API_TOKEN)
|
| 12 |
+
|
| 13 |
@cl.on_chat_start
async def main():
    """Initialise a new chat session: reset the history and greet the user.

    The history is stored in the Chainlit user session as a list of prompt /
    response strings that the message handler later joins into a single
    prompt for the model.
    """
    cl.user_session.set("history", [])
    # Plain string literal — the original used an f-string with no placeholders.
    msg = cl.Message(content="Loading Chat please wait ...")
    await msg.send()
|
| 18 |
|
|
|
|
| 27 |
@cl.on_message
async def main(message: str):
    """Stream a model completion for *message* and record it in the history.

    The user message is wrapped in Open-Assistant style control tokens, the
    whole history is concatenated into one prompt, and the generated tokens
    are streamed to the UI as they arrive.
    """
    # Defensive fallback: the session may not have been initialised if
    # on_chat_start did not run (e.g. after a server restart).
    h = cl.user_session.get("history") or []
    h.append("<|prompter|>" + message + "<|endoftext|><|assistant|>")

    resp = ""
    msg = cl.Message(content="")
    # text_generation(..., stream=True) on the async client returns an async
    # iterator of generated tokens.
    async for token in await client.text_generation(
        "".join(h), stream=True, max_new_tokens=250
    ):
        # Drop the end-of-text marker; stream everything else to the UI.
        # (Removed the per-token debug print and the print(h) below — they
        # leaked the full conversation history to stdout on every message.)
        if token != "<|endoftext|>":
            resp += token
            await msg.stream_token(token)

    h.append(resp + "<|endoftext|>")
    cl.user_session.set("history", h)
    await msg.send()
|
| 43 |
+
|
| 44 |
+
|
| 45 |
+
|