Spaces:

syk101
/

texlab

Runtime error

File size: 15,080 Bytes

d05a9d0

import os
import base64
import tempfile
import json
from flask import Blueprint, request, jsonify, current_app
from werkzeug.utils import secure_filename
import fitz  # PyMuPDF
import PyPDF2
from PIL import Image
from io import BytesIO
import cv2
import numpy as np

# Import the existing Pix2Text functionality
try:
    from pix2text import Pix2Text
    p2t = Pix2Text(analyzer_config=dict(model_name='mfd'))
except Exception as e:
    print(f"Warning: Could not initialize Pix2Text: {e}")
    p2t = None

# Import utility functions from other controllers
from controller.pix2text_controller import preprocess_image as preprocess_math_image
from controller.scribble_controller import preprocess_image as preprocess_scribble_image
from controller.pdf_controller import extract_text_from_pdf
from controller.table_controller import detect_table, generate_latex_table

chatbot_bp = Blueprint('chatbot_bp', __name__, url_prefix='/chatbot')

UPLOAD_FOLDER = 'static/uploads'
PROCESSED_FOLDER = 'static/processed'
os.makedirs(UPLOAD_FOLDER, exist_ok=True)
os.makedirs(PROCESSED_FOLDER, exist_ok=True)

def allowed_file(filename):
    """Check if file extension is allowed"""
    ALLOWED_EXTENSIONS = {'png', 'jpg', 'jpeg', 'pdf'}
    return '.' in filename and filename.rsplit('.', 1)[1].lower() in ALLOWED_EXTENSIONS

def is_table_image(image_path):
    """Check if the image is likely a table"""
    try:
        # Use the existing table detection logic
        rows, cols = detect_table(image_path)
        # If we detect at least 2 rows and 2 columns, it's likely a table
        return rows >= 2 and cols >= 2
    except Exception as e:
        print(f"Error detecting table: {e}")
        return False

def process_table_image(image_path):
    """Process table image and convert to LaTeX table"""
    try:
        # Detect table structure
        rows, cols = detect_table(image_path)
        
        # Generate LaTeX table code
        if rows > 0 and cols > 0:
            latex_code = generate_latex_table(rows, cols)
            return latex_code
        else:
            return "\\text{Could not detect table structure}"
    except Exception as e:
        print(f"Error processing table image: {e}")
        return f"\\text{{Error processing table: {str(e)}}}"

def process_math_image(image_path):
    """Process math image and convert to LaTeX using Pix2Text"""
    try:
        if p2t:
            # Try with original image first
            result = p2t.recognize(image_path)
            
            # Handle different result types
            if isinstance(result, dict):
                latex_code = result.get('text', '')
            elif isinstance(result, list):
                # If result is a list, extract text from first item
                if result and isinstance(result[0], dict):
                    latex_code = result[0].get('text', '')
                else:
                    latex_code = str(result)
            else:
                latex_code = str(result)
            
            # If we get no result or very short result, try with preprocessing
            if len(latex_code.strip()) < 2:
                print("Result too short, trying with preprocessing...")
                processed_path = preprocess_math_image(image_path)
                result = p2t.recognize(processed_path)
                
                if isinstance(result, dict):
                    latex_code = result.get('text', '')
                elif isinstance(result, list):
                    if result and isinstance(result[0], dict):
                        latex_code = result[0].get('text', '')
                    else:
                        latex_code = str(result)
                else:
                    latex_code = str(result)
            
            return latex_code
        else:
            return "\\text{Pix2Text not available}"
    except Exception as e:
        print(f"Error processing math image: {e}")
        return f"\\text{{Error processing math image: {str(e)}}}"

def process_image_for_latex(image_path):
    """Process image and convert to LaTeX, detecting if it's a table or math"""
    try:
        # First, check if it's a table
        if is_table_image(image_path):
            print("Detected table image, processing as table...")
            return process_table_image(image_path)
        else:
            print("Processing as math equation...")
            return process_math_image(image_path)
    except Exception as e:
        print(f"Error processing image: {e}")
        # Fallback to math processing
        return process_math_image(image_path)

def process_pdf_for_latex(pdf_path):
    """Process PDF and extract LaTeX with better math equation handling"""
    try:
        # Extract text from PDF
        text = extract_text_from_pdf(pdf_path)
        
        # Enhanced conversion to LaTeX with better math handling
        # Escape backslashes but preserve LaTeX commands
        latex = text.replace('\\', '\\textbackslash ')
        
        # Handle common math symbols and expressions
        math_replacements = {
            '∑': '\\sum',
            '∏': '\\prod',
            '∫': '\\int',
            '∞': '\\infty',
            '±': '\\pm',
            '×': '\\times',
            '÷': '\\div',
            '≤': '\\leq',
            '≥': '\\geq',
            '≠': '\\neq',
            '≈': '\\approx',
            '√': '\\sqrt',
            'α': '\\alpha',
            'β': '\\beta',
            'γ': '\\gamma',
            'δ': '\\delta',
            'ε': '\\epsilon',
            'θ': '\\theta',
            'λ': '\\lambda',
            'μ': '\\mu',
            'π': '\\pi',
            'σ': '\\sigma',
            'φ': '\\phi',
            'ω': '\\omega',
        }
        
        for symbol, replacement in math_replacements.items():
            latex = latex.replace(symbol, replacement)
        
        # Handle subscripts and superscripts (simple cases)
        import re
        # Replace simple subscripts like x1, x2 with x_1, x_2
        latex = re.sub(r'([a-zA-Z])(\d+)', r'\1_\2', latex)
        
        # Handle fractions in the form a/b
        latex = re.sub(r'(\d+)/(\d+)', r'\\frac{\1}{\2}', latex)
        
        # Add basic escaping for special LaTeX characters
        latex = latex.replace('_', '\\_').replace('^', '\\^').replace('&', '\\&')
        latex = latex.replace('%', '\\%').replace('$', '\\$').replace('#', '\\#')
        latex = latex.replace('{', '\\{').replace('}', '\\}')
        
        # Restore LaTeX commands by unescaping them
        latex = latex.replace('\\textbackslash ', '\\')
        
        # Try to detect and format mathematical expressions
        # Look for patterns that indicate mathematical content
        latex = re.sub(r'(\d+)x(\d+)', r'\1 \\times \2', latex)  # Handle multiplication
        latex = re.sub(r'(\d+)\^(\d+)', r'\1^\2', latex)  # Handle exponents
        
        return latex
    except Exception as e:
        print(f"Error processing PDF: {e}")
        return f"\\text{{Error processing PDF: {str(e)}}}"

@chatbot_bp.route('/chat', methods=['POST'])
def chat():
    """Enhanced chat endpoint that handles text, image, and PDF inputs"""
    try:
        # Handle file upload (image or PDF)
        if 'image' in request.files or 'pdf' in request.files:
            file = request.files.get('image') or request.files.get('pdf')
            
            if file and file.filename != '':
                if allowed_file(file.filename):
                    try:
                        # Secure filename
                        filename = secure_filename(file.filename)
                        # Add unique identifier to prevent conflicts
                        name, ext = os.path.splitext(filename)
                        unique_filename = f"{name}_{os.urandom(8).hex()}{ext}"
                        
                        # Save file
                        filepath = os.path.join(UPLOAD_FOLDER, unique_filename)
                        file.save(filepath)
                        
                        # Process based on file type
                        if ext.lower() in ['.png', '.jpg', '.jpeg']:
                            # Process image for LaTeX
                            latex_result = process_image_for_latex(filepath)
                            
                            # Determine if it was processed as a table or math
                            if "begin{tabular}" in latex_result:
                                file_type_desc = "table"
                            else:
                                file_type_desc = "math equation"
                            
                            return jsonify({
                                'success': True,
                                'response': f"I've processed your image as a {file_type_desc} and converted it to LaTeX:\n\n```\n{latex_result}\n```\n\nYou can copy this LaTeX code and use it in your documents.",
                                'latex': latex_result,
                                'file_type': 'image'
                            })
                        elif ext.lower() == '.pdf':
                            # Process PDF for LaTeX
                            latex_result = process_pdf_for_latex(filepath)
                            
                            return jsonify({
                                'success': True,
                                'response': f"I've processed your PDF and extracted the mathematical content in LaTeX format:\n\n```\n{latex_result}\n```\n\nYou can copy this LaTeX code and use it in your documents.",
                                'latex': latex_result,
                                'file_type': 'pdf'
                            })
                        else:
                            return jsonify({
                                'success': False,
                                'response': "Unsupported file type. Please upload an image (PNG, JPG, JPEG) or PDF file."
                            }), 400
                    except Exception as e:
                        return jsonify({
                            'success': False,
                            'response': f"Error processing file: {str(e)}"
                        }), 500
                else:
                    return jsonify({
                        'success': False,
                        'response': "Invalid file type. Please upload an image (PNG, JPG, JPEG) or PDF file."
                    }), 400
        
        # Handle JSON data (text messages)
        elif request.is_json:
            data = request.get_json()
            message = data.get('message', '')
            
            # Handle text message
            if message:
                # Generate response based on user input (existing functionality)
                lower_message = message.lower()
                
                if 'fraction' in lower_message or 'frac' in lower_message:
                    response = 'To write a fraction in LaTeX, use \\frac{numerator}{denominator}. For example: \\frac{1}{2} produces ½.'
                elif 'integral' in lower_message or 'int' in lower_message:
                    response = 'To write an integral in LaTeX, use \\int. For example: \\int_0^1 x^2 dx. For definite integrals, specify limits with _ and ^.'
                elif 'sum' in lower_message or 'sigma' in lower_message:
                    response = 'To write a summation in LaTeX, use \\sum. For example: \\sum_{i=1}^{n} i. Use _ for lower limit and ^ for upper limit.'
                elif 'limit' in lower_message or 'lim' in lower_message:
                    response = 'To write a limit in LaTeX, use \\lim. For example: \\lim_{x \\to 0} \\frac{\\sin x}{x} = 1.'
                elif 'matrix' in lower_message or 'array' in lower_message:
                    response = 'To create a matrix in LaTeX, use \\begin{matrix} ... \\end{matrix}. For example:\n\\begin{matrix}\na & b \\\\\nc & d\n\\end{matrix}'
                elif 'table' in lower_message or 'tabular' in lower_message:
                    response = 'To create a table in LaTeX, use the tabular environment. For example:\n\\begin{tabular}{|c|c|}\n\\hline\nColumn 1 & Column 2 \\\\\n\\hline\nItem 1 & Item 2 \\\\\n\\hline\n\\end{tabular}'
                elif 'equation' in lower_message or 'align' in lower_message:
                    response = 'To write equations in LaTeX, you can use:\n- Inline: $E = mc^2$\n- Display: $$E = mc^2$$\n- Aligned: \\begin{align} x &= y \\\\ y &= z \\end{align}'
                elif 'help' in lower_message or 'texlab' in lower_message:
                    response = "I'm the TexLab Assistant! I can help you with:\n- LaTeX syntax and commands\n- Mathematical notation\n- Document conversion tips\n- Using TexLab features\n\nJust ask me any LaTeX or math question!"
                elif 'image' in lower_message or 'picture' in lower_message or 'photo' in lower_message:
                    response = "You can upload images of math equations or tables by clicking the 'Image' button in the chat interface. I'll convert them to LaTeX code for you!"
                elif 'pdf' in lower_message or 'document' in lower_message:
                    response = "You can upload PDF files by clicking the 'PDF' button in the chat interface. I'll extract the content and convert it to LaTeX format!"
                else:
                    # Default response
                    response = "I'm the TexLab Assistant. I can help you with LaTeX syntax, mathematical notation, and document conversion.\n\n✨ New Features:\n• Upload images of math equations or tables for LaTeX conversion\n• Upload PDF files for content extraction\n\nTry asking me something like 'How do I write a fraction in LaTeX?' or 'How do I create a matrix?', or upload an image/PDF file!"
                
                return jsonify({
                    'success': True,
                    'response': response
                })
            
            # No valid input
            else:
                return jsonify({
                    'success': False,
                    'response': "Please provide a message, image, or PDF file to process."
                }), 400
        
        # No valid input
        else:
            return jsonify({
                'success': False,
                'response': "Please provide a message, image, or PDF file to process."
            }), 400
            
    except Exception as e:
        print(f"Error in chat endpoint: {e}")
        return jsonify({
            'success': False,
            'response': "Sorry, I encountered an error processing your request. Please try again."
        }), 500