Spaces:

Genie-AI-Lab
/

Genie-AI

Runtime error

Genie-AI-Lab committed on Oct 29, 2025

Commit

f37a8c9

verified ·

1 Parent(s): 4674efd

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,6 +1,22 @@
 import gradio as gr
-def chat(message):
-    return "Test response: " + message
 gr.ChatInterface(chat).launch()

 import gradio as gr
+from huggingface_hub import hf_hub_download
+import subprocess
+import os
+# Download our GGUF model at import time, before the UI is launched.
+# NOTE(review): presumably hf_hub_download returns the local file path of the
+# downloaded file (it is passed as `--model` below) — confirm against the
+# huggingface_hub docs.
+model_path = hf_hub_download(
+    repo_id="Genie-AI-Lab/Omni-Genie",
+    filename="Qwen2.5-3B-Instruct.Q4_0.gguf"
+)
+def chat(message, history):
+    """Return the stdout of a llama_cpp subprocess that is fed ``message``.
+
+    Runs ``python -m llama_cpp.server --model <model_path> --n_ctx 2048`` as
+    a child process, writes the encoded message to its stdin, waits for the
+    process to exit, and returns whatever it wrote to stdout.
+
+    Args:
+        message: Text of the incoming chat message.
+        history: Not used by this function. Presumably the earlier turns
+            passed in by gr.ChatInterface — TODO confirm.
+
+    Returns:
+        The child's captured stdout, decoded to ``str``. stderr is captured
+        as well but discarded, and the exit code is not checked.
+    """
+    # Use llama.cpp to run inference on our model
+    # NOTE(review): a new process is started for every message, so the model
+    # would be loaded again on each call.
+    # NOTE(review): `llama_cpp.server` looks like a long-running HTTP server
+    # rather than a one-shot CLI that reads a prompt from stdin. If so, this
+    # blocking call (no timeout) would never return — confirm against the
+    # llama-cpp-python documentation.
+    result = subprocess.run([
+        "python", "-m", "llama_cpp.server",
+        "--model", model_path,
+        "--n_ctx", "2048"
+    ], input=message.encode(), capture_output=True)
+    return result.stdout.decode()
 gr.ChatInterface(chat).launch()