Spaces:

st192011
/

Bitnet-Socratic-1-Bit

Running

App Files Files Community

st192011 committed 7 days ago

Commit

6f7a25d

verified ·

1 Parent(s): 0aa64c9

Create app.py

Browse files

Files changed (1) hide show

app.py +68 -0

app.py ADDED Viewed

	@@ -0,0 +1,68 @@

+import gradio as gr
+import subprocess
+import os
+# System prompt placed at the start of every request built in socratic_chat.
+# It asks the model for exactly three questions followed by the literal phrase
+# "stop token"; clean_socratic_output later truncates the reply at that phrase.
+SYSTEM_INSTRUCTION = (
+    "You are a Socratic assistant. Do not answer questions directly. "
+    "Instead, respond exclusively with 3 deep, reflective questions. "
+    "Then generate stop token"
+)
+# Relative path to the GGUF model file, passed to run_inference.py via "-m".
+MODEL_PATH = "models/BitNet-b1.58-2B-4T/ggml-model-i2_s.gguf"
+def clean_socratic_output(raw_stdout, full_prompt):
+    generated_text = raw_stdout.replace(full_prompt, "").strip()
+    stop_markers = ["Stop token", "stop token", "Stop.", "stop.", "Response:", "Response"]
+    lowest_index = len(generated_text)
+    marker_found = False
+    for marker in stop_markers:
+        idx = generated_text.find(marker)
+        if idx != -1 and idx < lowest_index:
+            lowest_index = idx
+            marker_found = True
+    if marker_found:
+        generated_text = generated_text[:lowest_index].strip()
+    if generated_text.endswith(("\n4.", "\n4", "4.", "4")):
+        generated_text = generated_text.rsplit("\n4", 1)[0].strip()
+    return generated_text
+def socratic_chat(user_query):
+    if not user_query.strip():
+        return "Please enter a valid question."
+    formatted_chat_prompt = f"System: {SYSTEM_INSTRUCTION}\nUser: {user_query}\nAssistant:"
+    cmd = [
+        "python3", "run_inference.py",
+        "-m", MODEL_PATH,
+        "-p", formatted_chat_prompt,
+        "-n", "100",
+        "-temp", "0.4",
+        "-t", "2"  # Matches HF Space 2-vCPU hardware allocation
+    ]
+    execution_result = subprocess.run(cmd, capture_output=True, text=True)
+    if execution_result.stdout:
+        return clean_socratic_output(execution_result.stdout, formatted_chat_prompt)
+    else:
+        return f"Error running model: {execution_result.stderr}"
+# Build the Gradio UI layout: a heading and description, then one row with
+# two columns. The first column holds the question textbox and the submit
+# button; the second column holds the textbox that shows the model's reply.
+with gr.Blocks(theme=gr.themes.Soft()) as demo:
+    gr.Markdown("# 🧠 1-Bit Local Socratic Assistant")
+    gr.Markdown("This interface is running an official Microsoft BitNet 1.58-bit model on an optimized CPU backend.")
+    with gr.Row():
+        with gr.Column():
+            input_text = gr.Textbox(label="What concept are you exploring?", placeholder="e.g., What is justice?")
+            submit_btn = gr.Button("Generate Socratic Reflection", variant="primary")
+        with gr.Column():
+            output_text = gr.Textbox(label="Socratic Feedback", lines=6)
+    # Clicking the button and submitting the textbox both call socratic_chat
+    # with the textbox content and write its return value to output_text.
+    submit_btn.click(fn=socratic_chat, inputs=input_text, outputs=output_text)
+    input_text.submit(fn=socratic_chat, inputs=input_text, outputs=output_text)
+# Start the web server only when this file is executed as a script.
+if __name__ == "__main__":
+    # Listen on all network interfaces on port 7860.
+    # NOTE(review): presumably the port the hosting Space expects — confirm.
+    demo.launch(server_name="0.0.0.0", server_port=7860)