LittleMonkeyLab committed on
Commit
95da712
·
verified ·
1 Parent(s): a2e761d

Upload app.py with huggingface_hub

Browse files
Files changed (1) hide show
  1. app.py +6 -3
app.py CHANGED
@@ -1,11 +1,14 @@
1
  import os
2
  import gradio as gr
3
- from huggingface_hub import InferenceClient
4
 
5
- client = InferenceClient(token=os.getenv("HF_TOKEN"))
 
 
 
6
 
7
  def chat(message, history):
8
- response = client.chat_completion(
9
  model="HuggingFaceH4/zephyr-7b-beta",
10
  messages=[{"role": "user", "content": message}],
11
  max_tokens=256
 
1
  import os
2
  import gradio as gr
3
+ from openai import OpenAI
4
 
5
+ client = OpenAI(
6
+ base_url="https://router.huggingface.co/v1",
7
+ api_key=os.getenv("HF_TOKEN")
8
+ )
9
 
10
  def chat(message, history):
11
+ response = client.chat.completions.create(
12
  model="HuggingFaceH4/zephyr-7b-beta",
13
  messages=[{"role": "user", "content": message}],
14
  max_tokens=256