File size: 686 Bytes
e8cc01c
bdd0c15
e8cc01c
5c98715
bdd0c15
 
79fd528
edfbc1e
bdd0c15
 
5c98715
 
edfbc1e
 
 
 
 
 
 
 
 
 
 
5c98715
edfbc1e
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
import gradio as gr
from huggingface_hub import InferenceClient

# Module-level Hugging Face inference client bound to the zephyr-7b-beta model;
# constructed once when the module loads and reused by respond() for each request.
client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")

def respond(message, history):
    """Stream the assistant's reply to *message*, given the prior *history*.

    Builds the chat prompt as a system message, followed by the previous
    turns, followed by the new user message, and sends it to the module-level
    ``client`` with streaming enabled.

    Args:
        message: The latest user message.
        history: Previous conversation turns, forwarded to the model as-is.
            Presumably a list of ``{"role": ..., "content": ...}`` dicts, as
            supplied by the chat UI in "messages" mode. May be empty or None.

    Yields:
        The reply accumulated so far, once per streamed chunk, so the caller
        can progressively render the growing text.
    """
    messages = [{"role": "system", "content": "You are a nice chatbot."}]

    if history:
        messages.extend(history)
    messages.append({"role": "user", "content": message})

    response = ""

    # Use a distinct loop name so the ``message`` parameter is not shadowed.
    for chunk in client.chat_completion(
        messages,
        max_tokens=500,
        temperature=0.2,
        top_p=0.9,
        stream=True,
    ):
        choices = chunk.choices
        # Some stream chunks (e.g. role-only or final/stop chunks) carry no
        # choices or a None delta content; appending those would raise.
        token = choices[0].delta.content if choices else None
        if token:
            response += token
        yield response
# Wrap respond() in a Gradio chat UI. type="messages" selects the message-dict
# history format, which respond() forwards to the model unchanged.
chatbot = gr.ChatInterface(respond, type="messages")
# Start serving the interface; this runs as a module-level side effect.
chatbot.launch()