Spaces:

Varshithdharmajv
/

mvm2-math-verification

Sleeping

App Files Files Community

Varshithdharmajv committed 23 days ago

Commit

dbd32c5

verified ·

1 Parent(s): 99f7550

Upload handwriting_transcriber.py with huggingface_hub

Browse files

Files changed (1) hide show

handwriting_transcriber.py +155 -0

handwriting_transcriber.py ADDED Viewed

	@@ -0,0 +1,155 @@

+"""
+Handwriting Transcriber Module
+Wrapper for handwritten-math-transcription repository
+"""
+import sys
+import os
+import torch
+from typing import Optional, Tuple
+# Add handwritten-math-transcription to path
+sys.path.insert(0, os.path.join(os.path.dirname(__file__), '..', 'handwritten-math-transcription'))
+try:
+    from model import Encoder, Decoder, Seq2Seq
+    from dataset.hme_ink import read_inkml_file
+    from utils import tokenize_latex
+    from corrector import correct_latex
+    from config import *
+except ImportError:
+    Encoder = None
+    Decoder = None
+    Seq2Seq = None
+    read_inkml_file = None
+    tokenize_latex = None
+    correct_latex = None
class HandwritingTranscriber:
    """
    Handwriting transcriber for mathematical expressions.

    Thin wrapper around the handwritten-math-transcription Seq2Seq model that
    is meant to convert handwritten math (InkML format) to LaTeX.

    NOTE: inference is not wired up yet. ``transcribe_inkml`` and
    ``transcribe_image`` currently return a fixed LaTeX placeholder string
    instead of a real prediction.
    """

    def __init__(self,
                 model_path: Optional[str] = None,
                 device: Optional[str] = None,
                 use_corrector: bool = True):
        """
        Initialize handwriting transcriber.

        Args:
            model_path: Path to trained model checkpoint. When given and the
                file exists, the model is loaded immediately; otherwise the
                transcriber starts without a model.
            device: Device to run model on ('cpu', 'cuda', 'mps'). Defaults
                to 'cuda' when available, else 'cpu'.
            use_corrector: Whether to use LLM corrector for post-processing

        Raises:
            ImportError: If the checkpoint file exists but the model classes
                could not be imported.
        """
        self.device = device or ('cuda' if torch.cuda.is_available() else 'cpu')
        self.use_corrector = use_corrector
        self.model = None
        self.model_path = model_path
        if model_path:
            # isfile (not exists): a directory can never be a checkpoint, so
            # do not hand it to torch.load.
            if os.path.isfile(model_path):
                self.load_model(model_path)
            else:
                # Make the "no model" state visible instead of skipping silently.
                print(f"Model checkpoint not found: {model_path}")

    @staticmethod
    def _extract_state_dict(checkpoint):
        """Return the state_dict from a bare or wrapped checkpoint object."""
        if isinstance(checkpoint, dict):
            # Training scripts often save {"model_state_dict": ..., "epoch": ...}.
            for key in ("model_state_dict", "state_dict"):
                nested = checkpoint.get(key)
                if isinstance(nested, dict):
                    return nested
        return checkpoint

    def load_model(self, model_path: str) -> bool:
        """
        Load trained model from checkpoint.

        Loading is best-effort: any failure while building the model or
        reading the weights is printed and leaves ``self.model`` as None.

        Args:
            model_path: Path to model checkpoint. The file may hold a bare
                state_dict or a dict wrapping it under 'model_state_dict' or
                'state_dict'.

        Returns:
            True if the model was loaded, False if loading failed.

        Raises:
            ImportError: If the model classes could not be imported.
        """
        if Seq2Seq is None:
            raise ImportError("Handwriting transcription model not available")
        try:
            # Model architecture parameters (from config or defaults).
            # NOTE(review): these must match the values the checkpoint was
            # trained with - confirm against the training configuration.
            input_dim = 11
            enc_hidden_dim = 256
            dec_hidden_dim = 256
            embed_dim = 128
            # LATEX_VOCAB_SIZE only exists when the star import from config
            # succeeded and defines it; fall back to 300 otherwise.
            output_dim = globals().get('LATEX_VOCAB_SIZE', 300)
            encoder_num_layers = 2
            decoder_num_layers = 2
            # Create model
            encoder = Encoder(input_dim, enc_hidden_dim,
                              num_layers=encoder_num_layers, bidirectional=True)
            decoder = Decoder(output_dim, embed_dim,
                              enc_hidden_dim, dec_hidden_dim,
                              num_layers=decoder_num_layers)
            model = Seq2Seq(encoder, decoder, self.device).to(self.device)
            # Load weights
            # NOTE(security): torch.load unpickles the file; only load
            # checkpoints from trusted sources (consider weights_only=True
            # on torch versions that support it).
            checkpoint = torch.load(model_path, map_location=self.device)
            model.load_state_dict(self._extract_state_dict(checkpoint))
            model.eval()
        except Exception as e:
            print(f"Error loading model: {e}")
            self.model = None
            return False
        # Publish the model only once it is fully initialised.
        self.model = model
        print(f"Model loaded from {model_path}")
        return True

    def transcribe_inkml(self, inkml_path: str) -> Tuple[str, str]:
        """
        Transcribe an InkML file to LaTeX.

        NOTE: model inference is not implemented yet; the prediction is a
        fixed placeholder (optionally passed through the corrector).

        Args:
            inkml_path: Path to InkML file

        Returns:
            Tuple of (predicted_latex, ground_truth_latex if available).
            Returns ("", "") if reading or processing the file fails.

        Raises:
            ValueError: If no model is loaded.
            ImportError: If the InkML reader could not be imported.
        """
        if self.model is None:
            raise ValueError("Model not loaded. Please load a model first.")
        if read_inkml_file is None:
            raise ImportError("InkML reading functionality not available")
        try:
            # Read InkML file; the strokes are not consumed until feature
            # extraction is implemented.
            _strokes, ground_truth = read_inkml_file(inkml_path)
            # Convert to model input format
            # This is a simplified version - actual implementation would need
            # proper feature extraction and tensor conversion
            # For now, return placeholder
            predicted_latex = "\\placeholder"
            # Apply corrector if enabled
            if self.use_corrector and correct_latex is not None:
                try:
                    predicted_latex = correct_latex(predicted_latex)
                except Exception as e:
                    # Corrector is optional: keep the uncorrected prediction.
                    print(f"Corrector error: {e}")
            return predicted_latex, ground_truth
        except Exception as e:
            print(f"Error transcribing InkML: {e}")
            return "", ""

    def transcribe_image(self, image_path: str) -> str:
        """
        Transcribe a handwritten math image to LaTeX.

        Note: This is a placeholder - actual implementation would require
        image preprocessing and conversion to InkML or direct image processing.
        The image is not read.

        Args:
            image_path: Path to image file

        Returns:
            Predicted LaTeX string (currently always the placeholder)
        """
        # This would require additional image processing
        # For now, return placeholder
        return "\\placeholder"

    def is_model_loaded(self) -> bool:
        """
        Check if model is loaded.

        Returns:
            True if model is loaded, False otherwise
        """
        return self.model is not None