Hulk810154 committed on
Commit
20b9745
·
verified ·
1 Parent(s): 58e1f7c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +33 -25
app.py CHANGED
@@ -1,62 +1,70 @@
1
  import gradio as gr
2
  from transformers import pipeline
3
 
4
- # β€”β€”β€” Load Pipelines β€”β€”β€”
5
  chat_pipe = pipeline(
6
  "text-generation",
7
  model="Hulk810154/Kai",
8
  trust_remote_code=True
9
- )
 
10
  asr_pipe = pipeline(
11
  "automatic-speech-recognition",
12
  model="openai/whisper-tiny"
13
- )
14
 
15
- # β€”β€”β€” Handlers β€”β€”β€”
16
  def chat_fn(message, history):
17
- prompt = ""
18
- for u, b in history:
19
- prompt += f"User: {u}\nAI: {b}\n"
20
  prompt += f"User: {message}\nAI:"
21
  out = chat_pipe(prompt, max_length=256, do_sample=True)
22
  reply = out[0]["generated_text"][len(prompt):].strip()
23
  history.append((message, reply))
24
  return history, history
25
 
26
- def speech_to_text(audio_path):
27
- if not audio_path:
 
28
  return ""
29
- return asr_pipe(audio_path)["text"]
 
 
 
 
 
30
 
31
  def handle_upload(files):
32
- return f"Received {len(files)} file(s): " + ", ".join([f.name for f in files])
 
33
 
34
- # β€”β€”β€” UI β€”β€”β€”
35
- with gr.Blocks() as demo:
36
- gr.Markdown("# 🧠 Kai AGI Chat\n**Type, Speak or Upload β€” true multimodal AGI.**")
37
- state = gr.State([])
38
 
39
  with gr.Row():
40
  with gr.Column():
41
- chatbot = gr.Chatbot(label="Conversation")
42
- txt = gr.Textbox(placeholder="Type here…", label="Text Input")
43
- mic = gr.Audio(source="microphone", type="filepath", label="🎀 Voice Input")
44
- send = gr.Button("Send")
45
  with gr.Column():
46
  uploader = gr.File(file_count="multiple", label="πŸ“Ž Upload Files/Images")
47
  upload_status = gr.Textbox(label="Upload Status")
48
 
49
- # Wire it up
50
- send.click(
51
- lambda txt, mic, history: ( speech_to_text(mic) or txt, history ),
52
- inputs=[txt, mic, state],
53
- outputs=[txt, state]
54
  ).then(
55
  chat_fn,
56
- inputs=[txt, state],
57
  outputs=[chatbot, state]
58
  )
59
 
 
60
  uploader.upload(handle_upload, inputs=uploader, outputs=upload_status)
61
 
62
  demo.launch()
 
1
  import gradio as gr
2
  from transformers import pipeline
3
 
4
+ # β€”β€”β€” Load models β€”β€”β€”
5
  chat_pipe = pipeline(
6
  "text-generation",
7
  model="Hulk810154/Kai",
8
  trust_remote_code=True
9
+ ) # Text generation 6
10
+
11
  asr_pipe = pipeline(
12
  "automatic-speech-recognition",
13
  model="openai/whisper-tiny"
14
+ ) # Whisper Tiny for STT 7
15
 
16
# ——— Core handlers ———
def chat_fn(message, history):
    """Generate a reply to *message* given the prior conversation.

    Args:
        message: the user's new utterance (plain text).
        history: session state — a list of (user, assistant) tuples.

    Returns:
        (messages, history): the transcript converted to the Chatbot
        "messages" format (role/content dicts) for display, and the
        updated tuple history for the gr.State component.
    """
    prompt = "".join(f"User: {u}\nAI: {b}\n" for u, b in history)
    prompt += f"User: {message}\nAI:"
    # max_new_tokens bounds only the reply; the previous max_length=256
    # counted the (growing) prompt too, so long chats would eventually
    # leave no room to generate anything.
    out = chat_pipe(prompt, max_new_tokens=256, do_sample=True)
    reply = out[0]["generated_text"][len(prompt):].strip()
    history.append((message, reply))
    # The Chatbot component is declared with type="messages", which expects
    # role/content dicts — feeding it raw tuples (the previous behavior)
    # fails at render time. Convert for display; keep tuples in state.
    messages = []
    for u, b in history:
        messages.append({"role": "user", "content": u})
        messages.append({"role": "assistant", "content": b})
    return messages, history
25
 
26
def transcribe(audio):
    """Turn recorded audio into text via the Whisper pipeline.

    Accepts either a filepath string (gr.Audio type="filepath") or the
    (sample_rate, data) tuple gr.Audio emits with type="numpy".

    Returns:
        The transcription string, or "" when no audio was provided.
    """
    if audio is None:
        return ""
    if isinstance(audio, (tuple, list)) and len(audio) == 2:
        # Gradio's numpy audio tuple is (sample_rate, data) — sample rate
        # FIRST. The previous `arr, sr = audio` unpacked it backwards and
        # handed Whisper a scalar "array" and an ndarray "sampling_rate".
        sr, data = audio
        import numpy as np  # local import: module import block stays untouched
        raw = np.asarray(data)
        # Whisper expects mono float32 in [-1, 1]; Gradio delivers int16 PCM.
        if np.issubdtype(raw.dtype, np.integer):
            raw = raw.astype(np.float32) / np.iinfo(raw.dtype).max
        else:
            raw = raw.astype(np.float32)
        if raw.ndim > 1:
            raw = raw.mean(axis=1)  # downmix multi-channel to mono
        return asr_pipe({"array": raw, "sampling_rate": sr})["text"]
    # Otherwise assume a filepath and let the pipeline load/resample it.
    return asr_pipe(audio)["text"]
36
 
37
def handle_upload(files):
    """Summarize the batch of files the user just uploaded."""
    names = [item.name for item in files]
    return f"Received {len(files)} file(s): " + ", ".join(names)
40
 
41
# ——— Build UI ———
with gr.Blocks() as demo:
    gr.Markdown("# 🧠 Kai AGI Chat\n_Chat via text, voice, or upload — true multimodal AGI_")
    state = gr.State([])  # per-session conversation memory, threaded through every event

    with gr.Row():
        with gr.Column():
            # "messages" selects the role/content dict payload format.
            # NOTE(review): chat_fn appends (user, reply) tuples — a
            # messages-format Chatbot expects dicts; confirm the handler's
            # first return value matches this component's type.
            chatbot = gr.Chatbot(type="messages", label="Conversation")
            txt_input = gr.Textbox(placeholder="Type here…", label="Text Input")
            # No `sources=` given — presumably relying on the default
            # microphone/upload sources and numpy output; verify against
            # what transcribe() accepts.
            mic_input = gr.Audio(label="🎤 Voice Input")
            send_btn = gr.Button("Send")
        with gr.Column():
            uploader = gr.File(file_count="multiple", label="📎 Upload Files/Images")
            upload_status = gr.Textbox(label="Upload Status")

    # Text or voice → chat. Step 1 resolves the effective message (a
    # non-empty transcription wins over typed text) back into the textbox;
    # step 2 feeds that textbox plus state into chat_fn via the chained
    # .then(), whose outputs refresh the chatbot and the state.
    send_btn.click(
        lambda txt, mic, hist: (transcribe(mic) or txt, hist),
        inputs=[txt_input, mic_input, state],
        outputs=[txt_input, state]
    ).then(
        chat_fn,
        inputs=[txt_input, state],
        outputs=[chatbot, state]
    )

    # File uploads only report a status line; they are not fed to the model.
    uploader.upload(handle_upload, inputs=uploader, outputs=upload_status)

demo.launch()