Scaryscar committed on
Commit
abd6fbd
·
verified ·
1 Parent(s): b7d954c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +24 -25
app.py CHANGED
@@ -3,45 +3,44 @@ from huggingface_hub import login
3
  import gradio as gr
4
  import os
5
 
6
# Authenticate against the Hub (HF_TOKEN is set in the Space secrets).
login(token=os.getenv("HF_TOKEN"))

# Lightweight 4-bit generation pipeline (faster than a full-precision load).
# NOTE(review): "load_in_4bit" via model_kwargs needs bitsandbytes installed;
# newer transformers versions prefer quantization_config=BitsAndBytesConfig —
# confirm against the pinned transformers release.
math_pipeline = pipeline(
    "text-generation",
    model="google/gemma-2b-it",
    device_map="auto",
    torch_dtype="auto",
    model_kwargs={"load_in_4bit": True},
)
18
def solve_math(question):
    """Super-fast response with optimized prompt."""
    # Same prompt text as before, assembled from explicit line parts.
    prompt = (
        "Solve this math problem concisely:\n"
        "\n"
        f"Question: {question}\n"
        "Answer:"
    )
    try:
        generation = math_pipeline(
            prompt,
            max_new_tokens=150,       # shorter output = faster
            temperature=0.1,          # near-deterministic
            do_sample=False,          # greedy decoding is quicker
            num_return_sequences=1,
        )
        # The pipeline echoes the prompt; keep only what follows "Answer:".
        full_text = generation[0]['generated_text']
        return full_text.split("Answer:")[-1].strip()
    except Exception as e:
        # Shown in the UI instead of crashing the app.
        return f"🚨 Error: {str(e)}"
36
-
37
# Warm the pipeline up once at startup so the first user request is fast.
solve_math("2+2=")

# Minimal UI for fastest response.
with gr.Blocks(title="⚡ Instant Math Solver") as demo:
    gr.Markdown("### Enter a math problem:")
    problem_input = gr.Textbox(lines=2)
    answer_output = gr.Textbox(label="Answer", lines=3)
    problem_input.submit(solve_math, problem_input, answer_output)

demo.launch(server_name="0.0.0.0")
 
3
  import gradio as gr
4
  import os
5
 
6
# Fail fast if the bitsandbytes dependency is missing from the Space.
try:
    import bitsandbytes  # noqa
except ImportError:
    raise ImportError("bitsandbytes not installed! Add it to requirements.txt")

# Log in to the Hugging Face Hub (HF_TOKEN comes from the Space secrets).
login(token=os.getenv("HF_TOKEN"))

# Text-generation pipeline for Gemma; 4-bit loading dropped for compatibility.
_PIPELINE_KWARGS = {
    "model": "google/gemma-2b-it",
    "device_map": "auto",                          # place weights automatically
    "torch_dtype": "auto",                         # let transformers pick the dtype
    "model_kwargs": {"low_cpu_mem_usage": True},   # tame load-time memory spikes
}
math_pipeline = pipeline("text-generation", **_PIPELINE_KWARGS)
 
26
def solve_math(question):
    """Answer a math problem with the Gemma text-generation pipeline.

    Args:
        question: The math problem typed by the user (may be None/empty).

    Returns:
        The model's answer (the text after the final "A:" marker), or an
        "Error: ..." string — the UI shows errors instead of raising.
    """
    # Guard against an empty textbox: avoid a pointless model call.
    question = (question or "").strip()
    if not question:
        return "Error: empty question"
    prompt = f"Solve concisely:\nQ: {question}\nA:"
    try:
        result = math_pipeline(
            prompt,
            max_new_tokens=100,  # short answers keep latency low
            # Greedy decoding; `temperature` is ignored (with a warning)
            # when do_sample=False, so it is intentionally not passed.
            do_sample=False,
        )
        # generated_text echoes the prompt; keep only what follows "A:".
        return result[0]['generated_text'].split("A:")[-1].strip()
    except Exception as e:
        # Surface failures in the answer box rather than crashing the UI.
        return f"Error: {str(e)}"
 
 
 
38
 
39
# Bare-bones Gradio front end: one input box wired to solve_math on submit.
with gr.Blocks() as demo:
    gr.Markdown("## Math Solver")
    problem_box = gr.Textbox(label="Problem")
    solution_box = gr.Textbox(label="Solution")
    problem_box.submit(solve_math, problem_box, solution_box)

demo.launch()