Spaces:

llmc
/

llmc_1558M

Runtime error

App Files Files Community

eliebak HF Staff committed on Jul 11, 2024

Commit

49dac5b

verified ·

1 Parent(s): 55e69ee

Update app.py

Browse files

Files changed (1) hide show

app.py +16 -49

app.py CHANGED Viewed

@@ -6,21 +6,13 @@ import torch
 import spaces
 # Initialize the client with your model
-client = InferenceClient("karpathy/gpt2_1558M_final2_hf") # Replace with your model's name or endpoint
-default_system = 'You are a helpful assistant'
 @spaces.GPU
-def respond(message, history, system_message, max_tokens, temperature, top_p):
-    # Combine system message, history, and new message
-    full_prompt = f"{system_message}\n\n"
-    for user, assistant in history:
-        full_prompt += f"Human: {user}\nAssistant: {assistant}\n"
-    full_prompt += f"Human: {message}\nAssistant:"
     response = ""
     for chunk in client.text_generation(
-        full_prompt,
         max_new_tokens=max_tokens,
         stream=True,
         temperature=temperature,
@@ -32,51 +24,28 @@ def respond(message, history, system_message, max_tokens, temperature, top_p):
             response += chunk.token.text
         elif hasattr(chunk, 'generated_text'):
             response += chunk.generated_text
-        yield history + [(message, response)]
-    # If the response is empty, yield a default message
     if not response:
-        yield history + [(message, "I apologize, but I couldn't generate a response.")]
-def clear_session():
-    return "", []
-def modify_system_session(system):
-    if not system:
-        system = default_system
-    return system, system, []
-def use_example(example):
-    return example
-def set_unicorn_example():
-    return unicorn_example
-def set_time_travel_example():
-    return time_travel_example
 # Define example prompts
 unicorn_example = "In a shocking finding, scientist discovered a herd of unicorns living in a remote, previously unexplored valley, in the Andes Mountains. Even more surprising to the researchers was the fact that the unicorns spoke perfect English."
 time_travel_example = "Explain the grandfather paradox in time travel and propose a potential resolution."
 with gr.Blocks() as demo:
-    gr.Markdown("<h1 style='text-align: center;'>LLM.C 1.5B Chat Demo (GPT-2 1.5B)</h1>")
-    with gr.Row():
-        with gr.Column(scale=3):
-            system_input = gr.Textbox(value=default_system, lines=1, label='System Prompt')
-        with gr.Column(scale=1):
-            modify_system = gr.Button("🛠️ Set system prompt and clear history")
-    system_state = gr.Textbox(value=default_system, visible=False)
-    chatbot = gr.Chatbot(label='LLM.C Chat')
-    message = gr.Textbox(lines=1, label='Your message')
     with gr.Row():
-        clear_history = gr.Button("🧹 Clear history")
-        submit = gr.Button("🚀 Send")
-    # New section for example prompts
     gr.Markdown("### Example prompts")
     with gr.Row():
         example1 = gr.Button("🦄 Unicorn Discovery")
@@ -88,12 +57,10 @@ with gr.Blocks() as demo:
         top_p = gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-p (Nucleus Sampling)")
     # Set up event handlers
-    message.submit(respond, inputs=[message, chatbot, system_state, max_tokens, temperature, top_p], outputs=[chatbot])
-    submit.click(respond, inputs=[message, chatbot, system_state, max_tokens, temperature, top_p], outputs=[chatbot])
-    clear_history.click(fn=clear_session, inputs=[], outputs=[message, chatbot])
-    modify_system.click(fn=modify_system_session, inputs=[system_input], outputs=[system_state, system_input, chatbot])
-    example1.click(fn=set_unicorn_example, inputs=[], outputs=[message])
-    example2.click(fn=set_time_travel_example, inputs=[], outputs=[message])
     gr.Markdown(
         """

 import spaces
 # Initialize the client with your model
+client = InferenceClient("karpathy/gpt2_1558M_final2_hf")
 @spaces.GPU
+def generate_text(prompt, max_tokens, temperature, top_p):
     response = ""
     for chunk in client.text_generation(
+        prompt,
         max_new_tokens=max_tokens,
         stream=True,
         temperature=temperature,
             response += chunk.token.text
         elif hasattr(chunk, 'generated_text'):
             response += chunk.generated_text
+        yield response
     if not response:
+        yield "I apologize, but I couldn't generate a response."
+def clear_input():
+    return ""
 # Define example prompts
 unicorn_example = "In a shocking finding, scientist discovered a herd of unicorns living in a remote, previously unexplored valley, in the Andes Mountains. Even more surprising to the researchers was the fact that the unicorns spoke perfect English."
 time_travel_example = "Explain the grandfather paradox in time travel and propose a potential resolution."
 with gr.Blocks() as demo:
+    gr.Markdown("<h1 style='text-align: center;'>LLM.C 1.5B Demo</h1>")
+    prompt = gr.Textbox(lines=3, label='Enter your prompt')
+    output = gr.Textbox(lines=10, label='Generated text')
     with gr.Row():
+        clear_button = gr.Button("🧹 Clear input")
+        submit = gr.Button("🚀 Generate")
     gr.Markdown("### Example prompts")
     with gr.Row():
         example1 = gr.Button("🦄 Unicorn Discovery")
         top_p = gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-p (Nucleus Sampling)")
     # Set up event handlers
+    submit.click(generate_text, inputs=[prompt, max_tokens, temperature, top_p], outputs=output)
+    clear_button.click(clear_input, inputs=[], outputs=prompt)
+    example1.click(lambda: unicorn_example, inputs=[], outputs=prompt)
+    example2.click(lambda: time_travel_example, inputs=[], outputs=prompt)
     gr.Markdown(
         """