Update app.py
app.py CHANGED
@@ -1,44 +1,62 @@
-from transformers import pipeline
-import gradio as gr
+from transformers import AutoModelForCausalLM, AutoTokenizer, pipeline
 import torch
+import gradio as gr
+import os
 
-#
+# 1. GPU Verification
 if not torch.cuda.is_available():
-    raise RuntimeError("Enable GPU in Space settings")
+    raise RuntimeError("❌ GPU not detected! Enable GPU in Space settings.")
+print(f"✅ Using GPU: {torch.cuda.get_device_name(0)}")
+
+# 2. Model Configuration
+MODEL_NAME = "google/gemma-2b-it"  # Try "mistralai/Mistral-7B-v0.1" for more power
 
-# Load
-
+# 3. Load Model with GPU Optimization
+tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
+model = AutoModelForCausalLM.from_pretrained(
+    MODEL_NAME,
+    device_map="auto",          # Auto-selects GPU
+    torch_dtype=torch.float16,  # Half-precision for memory
+    low_cpu_mem_usage=True      # Reduces CPU overhead
+)
+
+# 4. Create GPU-accelerated pipeline
+pipe = pipeline(
     "text-generation",
-    model=
-
-
-
-        "low_cpu_mem_usage": True,
-        "trust_remote_code": True
-    }
+    model=model,
+    tokenizer=tokenizer,
+    # device placement is handled by device_map="auto" (passing device= here would error)
+    torch_dtype=torch.float16
 )
 
-
-def solve_math(prompt):
+# 5. Generation Function
+def generate_text(prompt):
     try:
-
+        outputs = pipe(
             prompt,
-            max_new_tokens=
-            temperature=0.
-            do_sample=
+            max_new_tokens=150,
+            temperature=0.7,
+            do_sample=True,
+            pad_token_id=tokenizer.eos_token_id
         )
-        return
+        return outputs[0]['generated_text']
     except Exception as e:
-        return f"Error: {str(e)}"
-
-# Preload
-solve_math("2+2=")
+        return f"⚠️ Error: {str(e)}"
 
-#
-with gr.Blocks() as demo:
-    gr.Markdown("##
-
-
-
+# 6. Gradio Interface
+with gr.Blocks(theme=gr.themes.Soft()) as demo:
+    gr.Markdown("## 🚀 GPU-Powered Text Generator")
+    with gr.Row():
+        inp = gr.Textbox(label="Your Prompt", placeholder="Type here...")
+    with gr.Row():
+        out = gr.Textbox(label="Generated Text", lines=5)
+    with gr.Row():
+        btn = gr.Button("Generate", variant="primary")
+
+    btn.click(fn=generate_text, inputs=inp, outputs=out)
+    inp.submit(fn=generate_text, inputs=inp, outputs=out)
 
-
+# 7. Launch with GPU monitoring
+if __name__ == "__main__":
+    print(f"GPU Memory Allocated: {torch.cuda.memory_allocated()/1e9:.2f} GB")
+    demo.launch(server_name="0.0.0.0")