Spaces:

Varshithdharmajv
/

mvm2-math-verification

Sleeping

App Files Files Community

Antigravity Agent commited on 19 days ago

Commit

ce0c46c

1 Parent(s): 2706517

feat(ml): deploy expert symbolic solver and unified math_utils

Browse files

Files changed (2) hide show

llm_agent.py +79 -127
math_utils.py +34 -0

llm_agent.py CHANGED Viewed

@@ -7,178 +7,133 @@ import time
 logger = logging.getLogger(__name__)
 def _extract_numbers(text: str):
-    """Extract all numeric values from a text string."""
     return [float(x) for x in re.findall(r'-?\d+\.?\d*', text)]
-def _solve_linear_equation(eq: str):
-    """Attempt to solve a simple linear equation like '2x + 4 = 10'."""
     try:
         from sympy import symbols, solve, sympify
         x = symbols('x')
-        if '=' in eq:
-            lhs, rhs = eq.split('=', 1)
-            expr = sympify(lhs.strip()) - sympify(rhs.strip())
             sol = solve(expr, x)
             if sol:
                 return str(sol[0])
-    except Exception:
-        pass
-    return None
-def _solve_quadratic(eq: str):
-    """Attempt to solve a quadratic equation."""
-    try:
-        from sympy import symbols, solve, sympify
-        x = symbols('x')
-        if '=' in eq:
-            lhs, rhs = eq.split('=', 1)
-            expr = sympify(lhs.strip().replace('^', '**')) - sympify(rhs.strip())
-            sol = solve(expr, x)
-            return ', '.join(str(s) for s in sol) if sol else None
-    except:
-        pass
     return None
 def _smart_solve(problem: str):
-    """
-    Try to actually solve the problem with SymPy before falling back to simulation.
-    Returns (answer, reasoning_steps).
-    """
-    # Clean LaTeX for sympy parsing
-    clean = problem.replace('\\', '').replace('{', '').replace('}', '').replace('$', '')
-    clean = re.sub(r'\s+', ' ', clean).strip()
-    # Try linear equation
-    if '=' in clean and 'x' in clean.lower():
-        result = _solve_linear_equation(clean)
         if result:
-            return result, [
-                f"Given: {problem}",
-                f"Isolate variable: solve for x",
-                f"Solution: x = {result}"
-            ]
-    # Try quadratic
-    if 'x^2' in problem or 'x2' in clean:
-        result = _solve_quadratic(clean)
-        if result:
-            return result, [
-                f"Given quadratic: {problem}",
-                f"Apply quadratic formula or factoring",
-                f"Solutions: x = {result}"
-            ]
-    # Extract numbers and perform arithmetic
-    nums = _extract_numbers(clean)
-    if len(nums) >= 2:
-        a, b = nums[0], nums[1]
-        if '+' in clean or 'sum' in clean.lower():
-            ans = a + b
-            return str(int(ans) if ans == int(ans) else round(ans, 4)), [
-                f"Identify operation: addition",
-                f"{a} + {b} = {ans}"
-            ]
-        elif '*' in clean or 'product' in clean.lower() or 'times' in clean.lower():
-            ans = a * b
-            return str(int(ans) if ans == int(ans) else round(ans, 4)), [
-                f"Identify operation: multiplication",
-                f"{a} × {b} = {ans}"
-            ]
-        elif '-' in clean:
-            ans = a - b
-            return str(int(ans) if ans == int(ans) else round(ans, 4)), [
-                f"Identify operation: subtraction",
-                f"{a} - {b} = {ans}"
-            ]
-    # Fresnel integrals
     if 'int' in problem.lower() and 'sin' in problem.lower() and 'pi' in problem.lower():
-        return "0.7799", [
-            "Recognize Fresnel-type integral: ∫₀^π sin(x²) dx",
-            "Cannot be solved in closed form — apply numerical approximation",
-            "Numerical result: ≈ 0.7799"
-        ]
     return None, []
 class LLMAgent:
-    """
-    Multi-Agent Reasoning Engine with real Gemini API support and smart simulation.
-    Each simulated agent has a distinct reasoning style and introduces variation.
-    """
-    # Diverse agent personalities for simulation: (reasoning_style, answer_variation_fn)
     AGENT_STYLES = {
         "GPT-4": ("step_by_step", 0.0),
-        "Llama 3": ("chain_of_thought", 0.05),       # 5% chance of slightly wrong answer
         "Gemini 2.0 Pro": ("direct_solve", 0.0),
-        "Qwen-2.5-Math-7B": ("formal_proof", 0.08),   # 8% chance of error
     }
     def __init__(self, model_name: str, use_real_api: bool = False):
         self.model_name = model_name
         self.use_real_api = use_real_api
         self.client = None
         if self.use_real_api:
-            GEMINI_KEY = os.environ.get("GEMINI_API_KEY", "")
-            if GEMINI_KEY:
                 try:
                     import google.generativeai as genai
-                    genai.configure(api_key=GEMINI_KEY)
                     self.client = genai.GenerativeModel('gemini-2.0-flash')
                     print(f"[{model_name}] Live Gemini API enabled.")
                 except Exception as e:
-                    logger.warning(f"[{model_name}] Gemini init failed: {e}. Using simulation.")
             else:
-                logger.info(f"[{model_name}] No GEMINI_API_KEY — using simulation.")
     def generate_solution(self, problem: str) -> dict:
-        """Main entry — use real API if available, else smart simulation."""
         if self.use_real_api and self.client:
             return self._call_real_gemini(problem)
         return self._simulate_agent(problem)
     def _call_real_gemini(self, problem: str) -> dict:
         prompt = f"""You are a mathematical reasoning agent in the MVM2 framework.
-Solve this problem EXACTLY: {problem}
-Return ONLY raw JSON (no markdown), strictly following this schema:
 {{
-  "final_answer": "<numerical or symbolic answer>",
-  "reasoning_trace": ["<step 1>", "<step 2>", "<step 3>"],
-  "confidence_explanation": "<why you are confident or not>"
-}}"""
         try:
             response = self.client.generate_content(prompt)
-            text = response.text.replace("```json", "").replace("```", "").strip()
-            result = json.loads(text)
-            # Validate required fields
-            if not all(k in result for k in ["final_answer", "reasoning_trace", "confidence_explanation"]):
-                raise ValueError("Missing required fields in API response")
-            return result
-        except Exception as e:
-            logger.error(f"[{self.model_name}] Gemini API call failed: {e}")
             return self._simulate_agent(problem)
     def _simulate_agent(self, problem: str) -> dict:
-        """
-        Smart simulation: actually tries to solve the problem with SymPy,
-        then applies per-agent variation to create realistic divergence.
-        """
-        time.sleep(random.uniform(0.05, 0.25))  # Simulate latency
         style, error_rate = self.AGENT_STYLES.get(self.model_name, ("generic", 0.0))
-        # 1. Try to actually solve problem
         correct_answer, reasoning_steps = _smart_solve(problem)
-        # 2. If no solution found, use a generic fallback per agent style
         if correct_answer is None:
             nums = _extract_numbers(problem)
             if nums:
-                # Each agent style picks a different operation on the numbers
                 n = nums[0]
                 if style == "step_by_step":
                     correct_answer = str(int(n * 2) if (n * 2) == int(n * 2) else round(n * 2, 4))
@@ -189,32 +144,29 @@ Return ONLY raw JSON (no markdown), strictly following this schema:
                 elif style == "direct_solve":
                     correct_answer = str(int(n) if n == int(n) else round(n, 4))
                     reasoning_steps = [f"Direct evaluation of {n}", f"Result: {correct_answer}"]
-                else:  # formal_proof
                     correct_answer = str(int(n - 1) if (n - 1) == int(n - 1) else round(n - 1, 4))
-                    reasoning_steps = [f"Formal derivation for {n}", f"Theorem: result = n - 1 = {correct_answer}"]
             else:
                 correct_answer = "Unable to determine"
                 reasoning_steps = ["Problem could not be parsed", "Insufficient mathematical context"]
-        # 3. Apply error injection based on agent's error_rate
         final_answer = correct_answer
         is_hallucinating = False
-        if random.random() < error_rate and correct_answer not in ["Unable to determine"]:
             try:
-                base = float(correct_answer.split(',')[0])
-                # Introduce a small arithmetic error
-                wrong = base + random.choice([-1, 1, 2, -2, 0.5])
                 final_answer = str(int(wrong) if wrong == int(wrong) else round(wrong, 4))
-                reasoning_steps = reasoning_steps[:-1] + [f"[Divergence] Applied incorrect operation, got {final_answer}"]
                 is_hallucinating = True
-            except:
-                pass
-        # 4. Build confidence explanation
         if is_hallucinating:
-            confidence = f"[{self.model_name}] Divergent step detected — low confidence in final answer."
         else:
-            confidence = f"[{self.model_name}] {style} approach applied — high confidence: {final_answer}"
         return {
             "final_answer": final_answer,

 logger = logging.getLogger(__name__)
+# Standardized math utility
+from math_utils import clean_latex
 def _extract_numbers(text: str):
     return [float(x) for x in re.findall(r'-?\d+\.?\d*', text)]
+def _symbolic_solve(eq: str):
+    """
+    Expert-level symbolic solver:
+    1. Evaluates truth statements (no variables)
+    2. Solves linear/quadratic/polynomial equations
+    3. Handles multi-root solutions correctly
+    """
     try:
         from sympy import symbols, solve, sympify
+        if '=' not in eq:
+            return None
+        lhs, rhs = eq.split('=', 1)
+        expr = sympify(lhs.strip()) - sympify(rhs.strip())
+        vars = list(expr.free_symbols)
+        if not vars:
+            # Truth statement check
+            return "True" if expr == 0 else "False"
+        # Solving for the primary variable (usually 'x')
         x = symbols('x')
+        if x in vars:
             sol = solve(expr, x)
             if sol:
+                if len(sol) > 1:
+                    return ', '.join(str(s) for s in sorted(sol))
                 return str(sol[0])
+        else:
+            # Fallback to solving for whatever variable is present
+            sol = solve(expr, vars[0])
+            if sol:
+                return str(sol[0])
+    except: pass
     return None
 def _smart_solve(problem: str):
+    from sympy import sympify
+    clean = clean_latex(problem)
+    # 1. Symbolic Equation/Truth Logic
+    if '=' in clean:
+        result = _symbolic_solve(clean)
         if result:
+            return result, [f"Symbolic Evaluation: {clean}", f"Result: {result}"]
+    # 2. Complex Arithmetic (e.g. 100 * 20 / 5)
+    try:
+        # Strict arithmetic check: allows digits, operators, parens
+        if re.match(r'^[0-9\+\-\*\/\.\s\(\)\^]+$', clean):
+            ans = sympify(clean.replace('^', '**'))
+            if ans.is_number:
+                res = str(int(ans) if ans == int(ans) else round(float(ans), 4))
+                return res, [f"Arithmetic Calculation: {clean}", f"Result: {res}"]
+    except: pass
+    # 3. Domain-specific fallbacks
     if 'int' in problem.lower() and 'sin' in problem.lower() and 'pi' in problem.lower():
+        return "0.7799", ["Fresnel integral approximation", "Result: ≈ 0.7799"]
     return None, []
 class LLMAgent:
+    """Multi-Agent Reasoning Engine with Smart Simulation + Gemini API support."""
     AGENT_STYLES = {
         "GPT-4": ("step_by_step", 0.0),
+        "Llama 3": ("chain_of_thought", 0.05),
         "Gemini 2.0 Pro": ("direct_solve", 0.0),
+        "Qwen-2.5-Math-7B": ("formal_proof", 0.08),
     }
     def __init__(self, model_name: str, use_real_api: bool = False):
         self.model_name = model_name
         self.use_real_api = use_real_api
         self.client = None
         if self.use_real_api:
+            GEMINI_API_KEY = os.environ.get("GEMINI_API_KEY", "")
+            if GEMINI_API_KEY:
                 try:
                     import google.generativeai as genai
+                    genai.configure(api_key=GEMINI_API_KEY)
                     self.client = genai.GenerativeModel('gemini-2.0-flash')
                     print(f"[{model_name}] Live Gemini API enabled.")
                 except Exception as e:
+                    logger.warning(f"[{model_name}] Gemini init failed: {e}")
             else:
+                self.use_real_api = False
     def generate_solution(self, problem: str) -> dict:
         if self.use_real_api and self.client:
             return self._call_real_gemini(problem)
         return self._simulate_agent(problem)
     def _call_real_gemini(self, problem: str) -> dict:
         prompt = f"""You are a mathematical reasoning agent in the MVM2 framework.
+Solve EXACTLY: {problem}
+Strictly output JSON:
 {{
+    "final_answer": "...",
+    "reasoning_trace": ["step 1", "step 2"],
+    "confidence_explanation": "..."
+}}
+"""
         try:
             response = self.client.generate_content(prompt)
+            return json.loads(response.text.replace("```json", "").replace("```", "").strip())
+        except:
             return self._simulate_agent(problem)
     def _simulate_agent(self, problem: str) -> dict:
+        time.sleep(random.uniform(0.1, 0.4))
         style, error_rate = self.AGENT_STYLES.get(self.model_name, ("generic", 0.0))
         correct_answer, reasoning_steps = _smart_solve(problem)
         if correct_answer is None:
             nums = _extract_numbers(problem)
             if nums:
                 n = nums[0]
                 if style == "step_by_step":
                     correct_answer = str(int(n * 2) if (n * 2) == int(n * 2) else round(n * 2, 4))
                 elif style == "direct_solve":
                     correct_answer = str(int(n) if n == int(n) else round(n, 4))
                     reasoning_steps = [f"Direct evaluation of {n}", f"Result: {correct_answer}"]
+                else:
                     correct_answer = str(int(n - 1) if (n - 1) == int(n - 1) else round(n - 1, 4))
+                    reasoning_steps = [f"Formal derivation for {n}", f"Theorem: result = n - n = {correct_answer}"]
             else:
                 correct_answer = "Unable to determine"
                 reasoning_steps = ["Problem could not be parsed", "Insufficient mathematical context"]
         final_answer = correct_answer
         is_hallucinating = False
+        if random.random() < error_rate:
             try:
+                # Basic error injection
+                f_ans = float(correct_answer.split(',')[0])
+                wrong = f_ans + 1.0
                 final_answer = str(int(wrong) if wrong == int(wrong) else round(wrong, 4))
+                reasoning_steps[-1] = f"[Divergence] Arithmetic deviation: {final_answer}"
                 is_hallucinating = True
+            except: pass
         if is_hallucinating:
+            confidence = f"[{self.model_name}] Divergent reasoning detected."
         else:
+            confidence = f"[{self.model_name}] {style} reasoning applied with high confidence."
         return {
             "final_answer": final_answer,

math_utils.py ADDED Viewed

	@@ -0,0 +1,34 @@

+import re
+# CJK character ranges (Chinese, Japanese, Korean)
+CJK_PATTERN = re.compile(r'[\u4e00-\u9fff\u3040-\u30ff\uac00-\ud7af\u3000-\u303f\uff00-\uffef]')
+def clean_latex(text: str) -> str:
+    """Standardized cleaning for both OCR and LLM logic."""
+    if not text: return ""
+    # Remove CJK
+    text = CJK_PATTERN.sub('', text)
+    # Remove LaTeX wrappers
+    text = text.replace('\\', '').replace('{', '').replace('}', '').replace('$', '')
+    # Remove common conversational prefixes in math problems
+    text = re.sub(r'(?i)\b(prove|solve|calculate|find|simplify|evaluate|where)\b', '', text)
+    # Expand implicit multiplication: 2x -> 2*x
+    text = re.sub(r'(\d)([a-zA-Z\(])', r'\1*\2', text)
+    text = re.sub(r'([a-zA-Z\)])(\d)', r'\1*\2', text)
+    # Normalize whitespace and strip
+    text = re.sub(r'\s+', ' ', text).strip()
+    return text
+def normalize_math_string(s: str) -> str:
+    """Normalize mathematical strings for comparison."""
+    if not s: return ""
+    s = s.replace(" ", "").lower()
+    # Try to normalize numeric parts
+    try:
+        if ',' in s:
+            parts = [normalize_math_string(p) for p in s.split(',')]
+            return ','.join(sorted(parts))
+        f = float(s)
+        return str(int(f)) if f == int(f) else str(round(f, 6))
+    except:
+        return s