Update app.py
Browse files
app.py
CHANGED
|
@@ -3,12 +3,12 @@ from langchain_huggingface import HuggingFacePipeline
|
|
| 3 |
from langchain.chains import ConversationChain
|
| 4 |
from langchain.memory import ConversationBufferMemory
|
| 5 |
|
| 6 |
-
# Load lightweight model (distilgpt2, ~82M parameters, fast on CPU)
|
| 7 |
llm = HuggingFacePipeline.from_model_id(
|
| 8 |
model_id="distilgpt2",
|
| 9 |
task="text-generation",
|
| 10 |
pipeline_kwargs={
|
| 11 |
-
"max_new_tokens":
|
| 12 |
"do_sample": True,
|
| 13 |
"temperature": 0.7, # Balanced creativity
|
| 14 |
"top_k": 40,
|
|
@@ -30,23 +30,26 @@ conversation = ConversationChain(
|
|
| 30 |
def chat_with_agent(message, history):
|
| 31 |
try:
|
| 32 |
response = conversation.predict(input=message)
|
| 33 |
-
# Clean up response
|
| 34 |
-
response = response.strip().split("\n")[0]
|
| 35 |
-
return response
|
| 36 |
except Exception as e:
|
| 37 |
-
|
|
|
|
| 38 |
|
| 39 |
# Gradio chat interface
|
| 40 |
iface = gr.ChatInterface(
|
| 41 |
fn=chat_with_agent,
|
| 42 |
-
title="
|
| 43 |
-
description="
|
| 44 |
-
examples=[
|
| 45 |
-
"My name is Alex. What's my name?",
|
| 46 |
-
"Tell me a quick joke."
|
| 47 |
-
]
|
| 48 |
)
|
| 49 |
|
| 50 |
-
#
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 51 |
if __name__ == "__main__":
|
| 52 |
iface.launch()
|
|
|
|
| 3 |
from langchain.chains import ConversationChain
|
| 4 |
from langchain.memory import ConversationBufferMemory
|
| 5 |
|
| 6 |
+
# Load a very lightweight model (distilgpt2, ~82M parameters, fast on CPU)
|
| 7 |
llm = HuggingFacePipeline.from_model_id(
|
| 8 |
model_id="distilgpt2",
|
| 9 |
task="text-generation",
|
| 10 |
pipeline_kwargs={
|
| 11 |
+
"max_new_tokens": 100, # Short responses for speed
|
| 12 |
"do_sample": True,
|
| 13 |
"temperature": 0.7, # Balanced creativity
|
| 14 |
"top_k": 40,
|
|
|
|
| 30 |
def chat_with_agent(message, history):
    """Produce one assistant reply for the Gradio chat callback.

    Parameters
    ----------
    message : str
        The user's latest message.
    history : list
        Chat history supplied by Gradio; unused here because the
        ConversationChain keeps its own memory.

    Returns
    -------
    str
        The model's reply, or a readable error string if prediction fails.
    """
    try:
        raw = conversation.predict(input=message)
        # distilgpt2 can be verbose; keep only the first line of the reply.
        reply = raw.strip().split("\n")[0]
    except Exception as e:
        # Surface the failure to the user instead of crashing the UI.
        reply = f"Error: {str(e)}. Try rephrasing your question."
    return reply
|
| 38 |
|
| 39 |
# Gradio chat interface.
# One-click starter prompts shown beneath the input box.
_EXAMPLE_PROMPTS = [
    "My name is Alex. What's my name?",
    "Tell me a short joke.",
]

iface = gr.ChatInterface(
    fn=chat_with_agent,
    title="Fast Free AI Agent",
    description=(
        "A lightweight conversational AI that remembers our talks. "
        "Hosted free on Hugging Face Spaces. Responses in ~3-10 seconds."
    ),
    examples=_EXAMPLE_PROMPTS,
)
|
| 46 |
|
| 47 |
+
def clear_memory():
    """Erase the module-level ConversationBufferMemory.

    Returns
    -------
    str
        A confirmation string suitable for display in the UI.
    """
    # Drops all stored turns; the next prediction starts from a blank slate.
    memory.clear()
    return "Conversation history cleared!"
|
| 51 |
+
|
| 52 |
+
# NOTE(review): this statement previously read
#   iface.additional_inputs = [gr.Button("Clear Memory", onclick=clear_memory)]
# which is broken on two counts: gr.Button accepts no `onclick` argument
# (Gradio wires events via `button.click(fn, ...)` inside a Blocks/ChatInterface
# context), and assigning `additional_inputs` after ChatInterface construction
# does not add the component to the already-built UI. The line was therefore a
# TypeError at import time or a silent no-op, so it is removed. To expose a
# working "Clear Memory" button, restructure the app as a gr.Blocks layout and
# wire `btn.click(clear_memory, outputs=...)`; until then clear_memory() is
# available programmatically only.
|
| 53 |
+
|
| 54 |
# Entry point: start the Gradio server when this file is run directly.
if __name__ == "__main__":
    iface.launch()
|