Spaces:

daniloedu
/

different_llms

Runtime error

App Files Files Community

daniloedu committed on Aug 3, 2023

Commit

3d441a2

1 Parent(s): f9d442c

Update app.py

Browse files

Files changed (1) hide show

app.py +52 -12

app.py CHANGED Viewed

@@ -1,15 +1,55 @@
+import os
+
 import gradio as gr
 from transformers import pipeline
-pipeline = pipeline(task="image-classification", model="julien-c/hotdog-not-hotdog")
-def predict(image):
-    predictions = pipeline(image)
-    return {p["label"]: p["score"] for p in predictions}
-gr.Interface(
-    predict,
-    inputs=gr.inputs.Image(label="Upload hot dog candidate", type="filepath"),
-    outputs=gr.outputs.Label(num_top_classes=2),
-    title="Hot Dog? Or Not?",
-).launch()

 import gradio as gr
 from transformers import pipeline
+# Module-level text-generation client shared by respond().
+# NOTE(review): API_URL is not defined anywhere in the visible file, so this
+# line raises NameError at import time unless it is defined elsewhere - confirm.
+# NOTE(review): respond() calls client.generate_stream(...), which looks like
+# the text-generation-inference client API; verify that the object returned by
+# transformers.pipeline() actually exposes that method and accepts api_url.
+client = pipeline("text-generation", model="upstage/Llama-2-70b-instruct", api_url=API_URL)
+def format_chat_prompt(message, chat_history, instruction):
+    prompt = f"System:{instruction}"
+    for turn in chat_history:
+        user_message, bot_message = turn
+        prompt = f"{prompt}\nUser: {user_message}\nAssistant: {bot_message}"
+    prompt = f"{prompt}\nUser: {message}\nAssistant:"
+    return prompt
+def respond(message, chat_history, instruction, temperature=0.7):
+    prompt = format_chat_prompt(message, chat_history, instruction)
+    chat_history = chat_history + [[message, ""]]
+    stream = client.generate_stream(prompt,
+                                      max_new_tokens=1024,
+                                      stop_sequences=["\nUser:", "<|endoftext|>"],
+                                      temperature=temperature)
+                                      #stop_sequences to not generate the user answer
+    acc_text = ""
+    #Streaming the tokens
+    for idx, response in enumerate(stream):
+            text_token = response.token.text
+            if response.details:
+                return
+            if idx == 0 and text_token.startswith(" "):
+                text_token = text_token[1:]
+            if any(word in text_token for word in SAFETY_GUIDELINES):
+                continue
+            acc_text += text_token
+            last_turn = list(chat_history.pop(-1))
+            last_turn[-1] += acc_text
+            chat_history = chat_history + [last_turn]
+            yield "", chat_history
+            acc_text = ""
+with gr.Blocks() as demo:
+    chatbot = gr.Chatbot(height=240) #just to fit the notebook
+    msg = gr.Textbox(label="Prompt")
+    with gr.Accordion(label="Advanced options",open=False):
+        system = gr.Textbox(label="System message", lines=2, value="A conversation between a user and an LLM-based AI assistant. The assistant gives helpful and honest answers.")
+        temperature = gr.Slider(label="temperature", minimum=0.1, maximum=1, value=0.7, step=0.1)
+    btn = gr.Button("Submit")
+    clear = gr.ClearButton(components=[msg, chatbot], value="Clear console")
+    btn.click(respond, inputs=[msg, chatbot, system], outputs=[msg, chatbot])
+    msg.submit(respond, inputs=[msg, chatbot, system], outputs=[msg, chatbot]) #Press enter to submit
+gr.close_all()
+demo.queue().launch(share=True, server_port=int(os.environ['PORT4']))