Spaces:

Scaryscar
/

Maths-charting-model

Runtime error

App Files Files Community

Scaryscar committed on Jul 26, 2025

Commit

6035c2a

verified ·

1 Parent(s): 2f2f576

Update app.py

Browse files

Files changed (1) hide show

app.py +69 -28

app.py CHANGED Viewed

@@ -1,47 +1,88 @@
-from transformers import pipeline, AutoModelForCausalLM, AutoTokenizer
-import gradio as gr
 import torch
-# Load the WizardMath tokenizer and model once, at module import (adjust model size if needed)
-model_name = "WizardLM/WizardMath-7B-V1.1"  # Larger alternative: "WizardLM/WizardMath-70B-V1.0"
-tokenizer = AutoTokenizer.from_pretrained(model_name)
 model = AutoModelForCausalLM.from_pretrained(
-    model_name,
-    torch_dtype=torch.float16,  # Half precision to reduce memory usage
-    device_map="auto"  # Auto-select GPU/CPU
 )
-def solve_math_problem(question):
-    """Answer one math question with the module-level WizardMath model.
-
-    Wraps the question in a USER/ASSISTANT prompt, generates up to 256 new
-    tokens, and returns the decoded text that follows the last
-    "ASSISTANT:" marker, with surrounding whitespace stripped.
-    """
-    # Format input for WizardMath
-    prompt = f"USER: Solve this math problem: {question}\nASSISTANT:"
-    # Generate response; the tokenized prompt is moved to the model's device first
-    inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
-    outputs = model.generate(
-        inputs.input_ids,
         max_new_tokens=256,
         pad_token_id=tokenizer.eos_token_id
     )
-    # Decode and clean output (the decoded text still contains the prompt)
-    answer = tokenizer.decode(outputs[0], skip_special_tokens=True)
-    answer = answer.split("ASSISTANT:")[-1].strip()  # Keep only the text after the last "ASSISTANT:" marker
     return answer
 # Gradio Interface
 demo = gr.Interface(
-    fn=solve_math_problem,  # Receives the input textbox contents; its return value fills the output textbox
-    inputs=gr.Textbox(lines=2, placeholder="Enter your math problem here..."),
-    outputs=gr.Textbox(label="Solution"),
-    title="🧙 WizardMath Problem Solver",
     examples=[
-        ["What is the integral of x^2 from 0 to 3?"],
-        ["Solve for x: 2x + 5 = 15"],
-        ["Calculate the area of a circle with radius 4."]
     ],
-    theme="soft"  # Try "default" or "huggingface"
 )
 if __name__ == "__main__":
-    demo.launch(server_port=7860, share=False)  # Serve on port 7860; set share=True for public link

+from transformers import (
+    AutoModelForCausalLM,
+    AutoTokenizer,
+    BitsAndBytesConfig,
+    pipeline
+)
 import torch
+import gradio as gr
+# Configuration
+MODEL_NAME = "WizardLM/WizardMath-7B-V1.1"  # Use 7B model for Spaces
+CACHE_DIR = "/tmp"  # Download model files under /tmp (Spaces has limited storage)
+# 4-bit quantization setup
+# NOTE(review): verify the Space hardware supports bitsandbytes 4-bit loading.
+quant_config = BitsAndBytesConfig(
+    load_in_4bit=True,  # Load weights in 4-bit precision
+    bnb_4bit_quant_type="nf4",  # NormalFloat4 quantization data type
+    bnb_4bit_compute_dtype=torch.float16,  # Dtype used for computation
+    bnb_4bit_use_double_quant=True  # Nested quantization: quantize the quantization constants too
+)
+# Load model with optimizations (runs once, at module import)
+tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME, cache_dir=CACHE_DIR)
 model = AutoModelForCausalLM.from_pretrained(
+    MODEL_NAME,
+    quantization_config=quant_config,
+    device_map="auto",
+    cache_dir=CACHE_DIR,
+    trust_remote_code=True  # NOTE(review): permits running code shipped in the model repo; confirm this model needs it
+)
+# Create a text generation pipeline around the already-loaded model and tokenizer
+# NOTE(review): torch_dtype/device_map below look redundant for a preloaded model; confirm.
+math_pipeline = pipeline(
+    "text-generation",
+    model=model,
+    tokenizer=tokenizer,
+    torch_dtype=torch.float16,
+    device_map="auto"
 )
+def solve_math(question):
+    """Generate a WizardMath answer for a single math question.
+
+    Args:
+        question: The problem text entered by the user.
+
+    Returns:
+        The model's completion with surrounding whitespace stripped, or a
+        short hint when the question is empty or blank.
+    """
+    # Skip the expensive generation call when there is nothing to solve.
+    if not question or not question.strip():
+        return "Please enter a math problem."
+    prompt = f"USER: {question}\nASSISTANT:"
+    # Generate response with adjusted parameters
+    outputs = math_pipeline(
+        prompt,
         max_new_tokens=256,
+        do_sample=True,
+        temperature=0.7,
+        top_k=50,
+        top_p=0.95,
+        # Return only the completion. Splitting the full text on the last
+        # "ASSISTANT:" marker picks the wrong segment whenever the model
+        # goes on to invent a further USER/ASSISTANT turn.
+        return_full_text=False,
         pad_token_id=tokenizer.eos_token_id
     )
+    # The prompt is already excluded, so only whitespace needs trimming.
+    answer = outputs[0]["generated_text"].strip()
     return answer
 # Gradio Interface
 demo = gr.Interface(
+    fn=solve_math,  # Receives the input textbox contents; its return value fills the output textbox
+    inputs=gr.Textbox(
+        label="Math Problem",
+        placeholder="Enter your math question here...",
+        lines=3
+    ),
+    outputs=gr.Textbox(
+        label="Solution",
+        lines=5
+    ),
+    title="🧮 WizardMath Solver",
+    description="Solves math problems using WizardMath-7B (4-bit quantized)",
     examples=[
+        ["What is 2^10 + 5*3?"],
+        ["Solve for x: 3x + 7 = 22"],
+        ["Calculate the area of a circle with radius 5"]
     ],
+    allow_flagging="never"  # Disable flagging. NOTE(review): may be deprecated in favor of flagging_mode; check the installed Gradio version
 )
+# Launch with Space-optimized settings
 if __name__ == "__main__":
+    demo.launch(
+        server_name="0.0.0.0",  # Listen on all network interfaces
+        server_port=7860,
+        share=False  # Set to True for public link during testing
+    )