Spaces:
Sleeping
Sleeping
mvkvc
committed on
Commit
·
6fe4e50
1
Parent(s):
f009e61
Add streaming toggle
Browse files
- README.md +1 -1
- app.py +34 -24
- poetry.lock +0 -0
- requirements.txt +0 -0
- sh/reqs.sh +1 -1
- sh/start.sh +1 -1
README.md
CHANGED
|
@@ -7,7 +7,7 @@ sdk: gradio
|
|
| 7 |
sdk_version: 4.24.0
|
| 8 |
app_file: app.py
|
| 9 |
pinned: false
|
| 10 |
-
short_description: '
|
| 11 |
---
|
| 12 |
|
| 13 |
Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference.
|
|
|
|
| 7 |
sdk_version: 4.24.0
|
| 8 |
app_file: app.py
|
| 9 |
pinned: false
|
| 10 |
+
short_description: 'Learn more at https://replicantzk.com.'
|
| 11 |
---
|
| 12 |
|
| 13 |
Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference.
|
app.py
CHANGED
|
@@ -1,13 +1,22 @@
|
|
|
|
|
| 1 |
from openai import AsyncOpenAI
|
| 2 |
import gradio as gr
|
| 3 |
|
| 4 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5 |
|
| 6 |
-
async def predict(message, history, model, temperature):
|
| 7 |
history_openai_format = []
|
| 8 |
for human, assistant in history:
|
| 9 |
history_openai_format.append({"role": "user", "content": human})
|
| 10 |
history_openai_format.append({"role": "assistant", "content": assistant})
|
|
|
|
| 11 |
history_openai_format.append({"role": "user", "content": message})
|
| 12 |
|
| 13 |
try:
|
|
@@ -15,31 +24,32 @@ async def predict(message, history, model, temperature):
|
|
| 15 |
model=model,
|
| 16 |
messages=history_openai_format,
|
| 17 |
temperature=temperature,
|
| 18 |
-
stream=
|
| 19 |
)
|
| 20 |
|
| 21 |
-
|
| 22 |
-
|
| 23 |
-
|
| 24 |
-
|
| 25 |
-
|
|
|
|
|
|
|
|
|
|
| 26 |
|
| 27 |
except Exception as e:
|
| 28 |
-
|
| 29 |
-
|
| 30 |
-
|
| 31 |
-
|
| 32 |
-
|
| 33 |
-
|
| 34 |
-
|
| 35 |
-
|
| 36 |
-
|
|
|
|
|
|
|
|
|
|
| 37 |
)
|
| 38 |
-
temperature_slider = gr.Slider(0, 1, value=0, label="Temperature")
|
| 39 |
-
api_key = gr.Textbox(label="OpenAI API Key")
|
| 40 |
-
|
| 41 |
-
desc = "Learn more and join here: https://replicantzk.com."
|
| 42 |
|
| 43 |
-
|
| 44 |
-
|
| 45 |
-
).launch()
|
|
|
|
| 1 |
+
import os
|
| 2 |
from openai import AsyncOpenAI
|
| 3 |
import gradio as gr
|
| 4 |
|
| 5 |
+
default_model = "llama3:8b-instruct-q4_K_M"
|
| 6 |
+
models = ["llama3:8b-instruct-q4_K_M", "codestral:22b-v0.1-q4_K_M"]
|
| 7 |
+
description = "Learn more at https://replicantzk.com."
|
| 8 |
+
base_url = os.getenv("OPENAI_BASE_URL") or "https://platform.replicantzk.com"
|
| 9 |
+
api_key = os.getenv("OPENAI_API_KEY")
|
| 10 |
+
|
| 11 |
+
|
| 12 |
+
async def predict(message, history, model, temperature, stream, base_url, api_key):
|
| 13 |
+
client = AsyncOpenAI(base_url=base_url, api_key=api_key)
|
| 14 |
|
|
|
|
| 15 |
history_openai_format = []
|
| 16 |
for human, assistant in history:
|
| 17 |
history_openai_format.append({"role": "user", "content": human})
|
| 18 |
history_openai_format.append({"role": "assistant", "content": assistant})
|
| 19 |
+
|
| 20 |
history_openai_format.append({"role": "user", "content": message})
|
| 21 |
|
| 22 |
try:
|
|
|
|
| 24 |
model=model,
|
| 25 |
messages=history_openai_format,
|
| 26 |
temperature=temperature,
|
| 27 |
+
stream=stream,
|
| 28 |
)
|
| 29 |
|
| 30 |
+
if stream:
|
| 31 |
+
partial_message = ""
|
| 32 |
+
async for chunk in response:
|
| 33 |
+
if chunk.choices[0].delta.content is not None:
|
| 34 |
+
partial_message += chunk.choices[0].delta.content
|
| 35 |
+
yield partial_message
|
| 36 |
+
else:
|
| 37 |
+
yield response.choices[0].message.content
|
| 38 |
|
| 39 |
except Exception as e:
|
| 40 |
+
raise gr.Error(str(e))
|
| 41 |
+
|
| 42 |
+
|
| 43 |
+
model = gr.Dropdown(label="Model", choices=models, value=default_model)
|
| 44 |
+
temperature = gr.Slider(0, 1, value=0, label="Temperature")
|
| 45 |
+
stream = gr.Checkbox(value=True, label="Stream")
|
| 46 |
+
base_url = gr.Textbox(label="OpenAI-compatible base URL", value=base_url)
|
| 47 |
+
api_key = gr.Textbox(label="OpenAI-compatible API key", type="password", value=api_key)
|
| 48 |
+
demo = gr.ChatInterface(
|
| 49 |
+
fn=predict,
|
| 50 |
+
additional_inputs=[model, temperature, stream, base_url, api_key],
|
| 51 |
+
description=description,
|
| 52 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
| 53 |
|
| 54 |
+
if __name__ == "__main__":
|
| 55 |
+
demo.launch()
|
|
|
poetry.lock
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
requirements.txt
CHANGED
|
The diff for this file is too large to render.
See raw diff
|
|
|
sh/reqs.sh
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
#! /bin/sh
|
| 2 |
|
| 3 |
-
poetry export -f requirements.txt --output requirements.txt
|
|
|
|
| 1 |
#! /bin/sh
|
| 2 |
|
| 3 |
+
poetry export -f requirements.txt --output ./requirements.txt
|
sh/start.sh
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
#! /bin/sh
|
| 2 |
|
| 3 |
-
poetry run
|
|
|
|
| 1 |
#! /bin/sh
|
| 2 |
|
| 3 |
+
poetry run gradio ./app.py
|