Spaces:

nashjiwani
/

AssistAI

Sleeping

App Files Files Community

nashjiwani committed on Sep 24, 2025

Commit

2dbba12

verified ·

1 Parent(s): 6a2c4b8

Update app.py

Browse files

Files changed (1) hide show

app.py +26 -33

app.py CHANGED Viewed

@@ -1,12 +1,12 @@
 import gradio as gr
 from transformers import pipeline
-# --- Pipelines (already working models, unchanged) ---
 # Module-level Hugging Face pipelines, built once when the module is loaded.
 # device=-1 asks transformers to run each pipeline on CPU.
 # NOTE(review): the Hub repo for the chat model appears to be published as
 # "Qwen/Qwen1.5-0.5B-Chat" (no hyphen after "Qwen") — confirm this id resolves.
 chat_model = pipeline(
     "text-generation",
     model="Qwen/Qwen-1.5-0.5B-Chat",
     device=-1,
 )
 caption_model = pipeline(
     "image-to-text",
     model="Salesforce/blip-image-captioning-base",
     device=-1,
 )
 speech_model = pipeline(
     "automatic-speech-recognition",
     model="openai/whisper-tiny",
     device=-1,
 )
-# --- Functions ---
 def process_text(user_input):
     """Generate text from `user_input` with the module-level `chat_model`.

     Samples up to 128 new tokens at temperature 0.7 and returns the
     "generated_text" field of the first result.

     NOTE(review): text-generation pipelines return the prompt followed by the
     continuation unless return_full_text=False is passed, so the returned
     string presumably begins with `user_input` — confirm that is intended.
     """
     generations = chat_model(
         user_input,
         max_new_tokens=128,
         do_sample=True,
         temperature=0.7,
     )
     first_generation = generations[0]
     return first_generation["generated_text"]
@@ -18,51 +18,44 @@ def process_image(image):
 def process_audio(audio_path):
     """Transcribe an audio file and generate a chat reply to the transcript.

     Runs `speech_model` on `audio_path`, reads the "text" field of its result,
     feeds that transcript to `process_text`, and returns a single
     Markdown-formatted string containing both the transcript and the reply.

     NOTE(review): there is no guard for a missing recording; presumably the UI
     can pass None when nothing was recorded — confirm how `speech_model`
     behaves in that case.
     """
     transcript = speech_model(audio_path)["text"]
     reply = process_text(transcript)
-    return f"🎤 You said: **{transcript}**\n\n🤖 Assistant whispers: {reply}"
-# --- Redesigned Gradio App ---
 # Gradio UI (previous revision): four tabs wired to the handler functions.
 # The css string styles the page body and the element whose elem_id is
 # "bigbox" (the chat input textbox below).
 with gr.Blocks(theme="soft", css="""
 body {
-    background: linear-gradient(135deg, #89f7fe, #66a6ff);
-    font-family: 'Trebuchet MS', sans-serif;
 }
-#bigbox {height: 250px}
 """) as demo:
     # Page header and intro text.
-    gr.HTML("<h1 style='text-align:center; color:white;'>✨ AssistAI Magic Tools ✨</h1>")
-    gr.Markdown("Pick a tab and enjoy some AI sorcery 🧙‍♂️\n---")
     # Chat tab: the textbox's submit event sends its text to process_text.
     with gr.Tab("💬 Chat Genie"):
-        gr.Markdown("Talk with your digital genie 🧞 — ask it riddles, poems, or advice!")
-        txt_in = gr.Textbox(label="Your wish ✨", lines=3, placeholder="Ask me anything...", elem_id="bigbox")
-        txt_out = gr.Textbox(label="Genie responds 🧞", lines=8)
         # Example prompts that fill txt_in when selected.
         examples = gr.Examples(
-            examples=["Tell me a riddle", "Summarize Harry Potter in one sentence", "What's faster: a cheetah or WiFi?"],
             inputs=[txt_in]
         )
-        txt_in.submit(process_text, inputs=txt_in, outputs=txt_out)
     # Image tab: the upload event sends the PIL image to process_image
     # (process_image is defined outside the lines shown in this view).
     with gr.Tab("🖼️ Image Magic"):
-        gr.Markdown("Upload an image and let the AI describe it like a mystical mirror 🪞✨")
-        img_in = gr.Image(type="pil", label="Drop your image here 📸")
         img_out = gr.Textbox(label="AI's magical description ✨", lines=5)
-        img_in.upload(process_image, inputs=img_in, outputs=img_out)
     # Voice tab: microphone audio is passed as a file path; the change event
     # on the audio component runs process_audio.
     with gr.Tab("🎤 Voice Spell"):
-        gr.Markdown("Cast a voice spell! Speak something and see it transcribed 🪄")
-        aud_in = gr.Audio(sources=["microphone"], type="filepath", label="Click and speak into the mic 🎙️")
-        aud_out = gr.Textbox(label="Transcription + Genie reply", lines=7)
-        aud_in.change(process_audio, inputs=aud_in, outputs=aud_out)
     # Extras tab: a Dataset of canned prompts whose click event calls process_text.
     # NOTE(review): a Dataset used as an input presumably delivers the selected
     # sample as a list rather than a plain string — confirm process_text
     # receives what chat_model expects.
-    with gr.Tab("🎲 Fun Extras"):
-        gr.Markdown("Some magic tricks to try instantly 🎉")
-        demo_examples = gr.Dataset(components=[gr.Textbox()], samples=[
-            ["Write a pirate poem about coding ⛵💻"],
-            ["Tell me a joke about AI 🤖😂"],
-            ["Explain infinity to a 5-year-old 🧸✨"]
-        ])
-        demo_out = gr.Textbox(label="AI Outputs", lines=7)
-        demo_examples.click(process_text, inputs=demo_examples, outputs=demo_out)
 # Start the app only when this file is executed as a script.
-if __name__ == "__main__":
-    demo.launch()

 import gradio as gr
 from transformers import pipeline
+# Pipelines (same as before, unchanged)
 # Module-level Hugging Face pipelines, built once when the module is loaded.
 # device=-1 asks transformers to run each pipeline on CPU.
 # NOTE(review): the Hub repo for the chat model appears to be published as
 # "Qwen/Qwen1.5-0.5B-Chat" (no hyphen after "Qwen") — confirm this id resolves.
 chat_model = pipeline(
     "text-generation",
     model="Qwen/Qwen-1.5-0.5B-Chat",
     device=-1,
 )
 caption_model = pipeline(
     "image-to-text",
     model="Salesforce/blip-image-captioning-base",
     device=-1,
 )
 speech_model = pipeline(
     "automatic-speech-recognition",
     model="openai/whisper-tiny",
     device=-1,
 )
+# Functions (all safe and previously working)
 def process_text(user_input):
     """Generate text from `user_input` with the module-level `chat_model`.

     Samples up to 128 new tokens at temperature 0.7 and returns the
     "generated_text" field of the first result.

     NOTE(review): text-generation pipelines return the prompt followed by the
     continuation unless return_full_text=False is passed, so the returned
     string presumably begins with `user_input` — confirm that is intended.
     """
     generations = chat_model(
         user_input,
         max_new_tokens=128,
         do_sample=True,
         temperature=0.7,
     )
     first_generation = generations[0]
     return first_generation["generated_text"]
 def process_audio(audio_path):
     """Transcribe an audio file and generate a chat reply to the transcript.

     Runs `speech_model` on `audio_path`, reads the "text" field of its result,
     feeds that transcript to `process_text`, and returns a single
     Markdown-formatted string containing both the transcript and the reply.

     NOTE(review): there is no guard for a missing recording; presumably the UI
     can pass None when the button is clicked before anything is recorded —
     confirm how `speech_model` behaves in that case.
     """
     transcript = speech_model(audio_path)["text"]
     reply = process_text(transcript)
+    return f"🎤 You said: **{transcript}**\n\n🤖 Assistant: {reply}"
 # Gradio UI: three tabs, each with an explicit button that triggers its handler.
 # The css string styles the page body and the element whose elem_id is
 # "chatbox" (the chat input textbox below).
 with gr.Blocks(theme="soft", css="""
 body {
+    background: linear-gradient(135deg, #ff9a9e, #fad0c4 30%, #fad0c4 70%, #fbc2eb);
+    font-family: 'Comic Sans MS', cursive;
 }
+#chatbox {height:200px}
 """) as demo:
     # Page header and intro text.
+    gr.HTML("<h1 style='text-align:center; color:white;'>🌈✨ AssistAI — Your Magical Multimodal Buddy ✨🌈</h1>")
+    gr.Markdown("Welcome! Try text, images, or your voice and see the magic 🧙‍♂️\n---")
     # Chat tab: clicking btn_chat sends the textbox content to process_text.
     with gr.Tab("💬 Chat Genie"):
+        txt_in = gr.Textbox(label="Ask me anything 🧞", lines=3, placeholder="E.g. Tell me a riddle", elem_id="chatbox")
+        btn_chat = gr.Button("✨ Generate Reply ✨")
+        txt_out = gr.Textbox(label="Genie Responds", lines=8)
         # Example prompts that fill txt_in when selected.
         examples = gr.Examples(
+            examples=[
+                "Tell me a riddle",
+                "Summarize Harry Potter in one sentence",
+                "What's faster: a cheetah or WiFi?",
+                "Write me a pirate poem about coding ⛵💻"
+            ],
             inputs=[txt_in]
         )
+        btn_chat.click(process_text, inputs=txt_in, outputs=txt_out)
     # Image tab: clicking btn_img sends the PIL image to process_image
     # (process_image is defined outside the lines shown in this view).
     with gr.Tab("🖼️ Image Magic"):
+        img_in = gr.Image(type="pil", label="Upload image 🖼️")
+        btn_img = gr.Button("🪄 Generate Caption")
         img_out = gr.Textbox(label="AI's magical description ✨", lines=5)
+        btn_img.click(process_image, inputs=img_in, outputs=img_out)
     # Voice tab: microphone audio is passed as a file path; clicking btn_voice
     # runs process_audio on it.
     with gr.Tab("🎤 Voice Spell"):
+        aud_in = gr.Audio(sources=["microphone"], type="filepath", label="Speak your spell 🎤")
+        btn_voice = gr.Button("🔮 Transcribe + Reply")
+        aud_out = gr.Textbox(label="Transcript + Genie reply", lines=7)
+        btn_voice.click(process_audio, inputs=aud_in, outputs=aud_out)
 # Launches unconditionally: there is no `__main__` guard, so this also runs
 # if the module is imported.
+demo.launch()