import gradio as gr from huggingface_hub import InferenceClient client=InferenceClient("HuggingFaceH4/zephyr-7b-beta") def respond(message, history): messages= [{'role':'system', "content":"You are a friend chatbot"}] if history: messages.extend(history) messages.append({'role':'user','content':message}) response = client.chat_completion( messages, max_tokens = 100, temperature = 0.2 ) return response['choices'][0]['message']['content'].strip() demo = gr.ChatInterface(respond, type="messages", autofocus=False, theme='mgetz/Celeb_glitzy') demo.launch()