Update app.py
Browse files
app.py
CHANGED
|
@@ -15,6 +15,11 @@ model = LatexOCR()
|
|
| 15 |
|
| 16 |
# Clean LaTeX output
|
| 17 |
def clean_latex(latex):
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 18 |
# ✅ Fix invalid LaTeX escapes like \+ \- \=
|
| 19 |
latex = re.sub(r'\\([+\-=])', r'\1', latex)
|
| 20 |
|
|
@@ -56,6 +61,9 @@ def clean_latex(latex):
|
|
| 56 |
latex = latex.replace(r'\cdot', '*')
|
| 57 |
latex = latex.replace('−', '-') # Replace Unicode minus
|
| 58 |
|
|
|
|
|
|
|
|
|
|
| 59 |
# Ensure it's an equation
|
| 60 |
if '=' not in latex:
|
| 61 |
latex += '=0'
|
|
@@ -64,6 +72,7 @@ def clean_latex(latex):
|
|
| 64 |
|
| 65 |
|
| 66 |
|
|
|
|
| 67 |
# Fallback to external LLM microservice
|
| 68 |
def request_llm_fallback(bad_latex, llm_url):
|
| 69 |
pre_cleaned = re.sub(
|
|
|
|
| 15 |
|
| 16 |
# Clean LaTeX output
|
| 17 |
def clean_latex(latex):
|
| 18 |
+
# 🔧 NEW FIX: Remove bad spacing escapes and redundant slashes
|
| 19 |
+
latex = latex.replace('\\ ', '') # Remove space escapes
|
| 20 |
+
latex = latex.replace('\\\\', '\\') # Reduce double slashes
|
| 21 |
+
latex = re.sub(r'\\[ \t\n\r\f\v]*', '', latex) # Remove \ followed by whitespace or control chars
|
| 22 |
+
|
| 23 |
# ✅ Fix invalid LaTeX escapes like \+ \- \=
|
| 24 |
latex = re.sub(r'\\([+\-=])', r'\1', latex)
|
| 25 |
|
|
|
|
| 61 |
latex = latex.replace(r'\cdot', '*')
|
| 62 |
latex = latex.replace('−', '-') # Replace Unicode minus
|
| 63 |
|
| 64 |
+
# 🔧 NEW FIX: Final cleanup - remove stray characters if needed
|
| 65 |
+
latex = re.sub(r'[^\w\s^=+*\-().]', '', latex)
|
| 66 |
+
|
| 67 |
# Ensure it's an equation
|
| 68 |
if '=' not in latex:
|
| 69 |
latex += '=0'
|
|
|
|
| 72 |
|
| 73 |
|
| 74 |
|
| 75 |
+
|
| 76 |
# Fallback to external LLM microservice
|
| 77 |
def request_llm_fallback(bad_latex, llm_url):
|
| 78 |
pre_cleaned = re.sub(
|