Spaces:

Varshithdharmajv
/

mvm2-math-verification

Sleeping

App Files Files Community

mvm2-math-verification / handwriting_transcriber.py

Varshithdharmajv

Upload handwriting_transcriber.py with huggingface_hub

dbd32c5 verified 2 months ago

raw

history blame contribute delete

5.35 kB

	"""
	Handwriting Transcriber Module
	Wrapper for handwritten-math-transcription repository
	"""

	import sys
	import os
	import torch
	from typing import Optional, Tuple

	# Make the handwritten-math-transcription directory (one level above this
	# file's directory) importable. It is inserted at the front of sys.path so
	# its modules take precedence over same-named modules found elsewhere.
	sys.path.insert(
	    0,
	    os.path.join(os.path.dirname(__file__), '..', 'handwritten-math-transcription'),
	)

	# The transcription repository is an optional dependency. If any of its
	# modules cannot be imported, every name below is set to None so that this
	# module still imports; callers check for None before using them.
	try:
	    from model import Encoder, Decoder, Seq2Seq
	    from dataset.hme_ink import read_inkml_file
	    from utils import tokenize_latex
	    from corrector import correct_latex
	    # Wildcard kept on purpose: load_model() looks up LATEX_VOCAB_SIZE in the
	    # module globals and falls back to a default when config lacks it.
	    from config import *  # noqa: F401,F403
	except ImportError:
	    Encoder = Decoder = Seq2Seq = None
	    read_inkml_file = tokenize_latex = correct_latex = None


	class HandwritingTranscriber:
	    """
	    Handwriting transcriber for mathematical expressions.

	    Wraps the Seq2Seq model from the handwritten-math-transcription
	    repository with the goal of converting handwritten math (InkML format)
	    to LaTeX.

	    NOTE: model inference is not wired up yet. ``transcribe_inkml`` and
	    ``transcribe_image`` currently produce the literal ``\\placeholder``
	    string instead of a real prediction.

	    Attributes:
	        device: Device string the model is moved to.
	        use_corrector: Whether the corrector post-processing step is applied.
	        model: The loaded Seq2Seq model, or None when nothing is loaded.
	        model_path: Path passed to the constructor, or the path of the most
	            recently loaded checkpoint.
	    """

	    def __init__(self,
	                 model_path: Optional[str] = None,
	                 device: Optional[str] = None,
	                 use_corrector: bool = True) -> None:
	        """
	        Initialize handwriting transcriber.

	        Args:
	            model_path: Path to trained model checkpoint. When given and the
	                path exists, the checkpoint is loaded immediately; when it
	                does not exist a notice is printed and no model is loaded.
	            device: Device to run model on ('cpu', 'cuda', 'mps'). When
	                omitted, 'cuda' is chosen if available, otherwise 'cpu'.
	            use_corrector: Whether to use LLM corrector for post-processing

	        Raises:
	            ImportError: If ``model_path`` exists but the transcription
	                model classes could not be imported.
	        """
	        self.device = device or ('cuda' if torch.cuda.is_available() else 'cpu')
	        self.use_corrector = use_corrector
	        self.model = None
	        self.model_path = model_path

	        if model_path:
	            if os.path.exists(model_path):
	                self.load_model(model_path)
	            else:
	                # Surface a mistyped path instead of silently staying unloaded.
	                print(f"Model checkpoint not found: {model_path}")

	    def load_model(self, model_path: str) -> None:
	        """
	        Load trained model from checkpoint.

	        Any failure while building the model or reading the checkpoint is
	        reported with ``print`` and leaves ``self.model`` set to None; it is
	        not re-raised.

	        Args:
	            model_path: Path to model checkpoint

	        Raises:
	            ImportError: If the transcription model classes are unavailable.
	        """
	        if Seq2Seq is None:
	            raise ImportError("Handwriting transcription model not available")

	        try:
	            # Model architecture parameters (from config or defaults)
	            input_dim = 11
	            enc_hidden_dim = 256
	            dec_hidden_dim = 256
	            embed_dim = 128
	            # Use the vocabulary size from the star-imported config when it
	            # defines one; otherwise fall back to 300.
	            output_dim = globals().get('LATEX_VOCAB_SIZE', 300)
	            encoder_num_layers = 2
	            decoder_num_layers = 2

	            # Create model
	            encoder = Encoder(input_dim, enc_hidden_dim,
	                              num_layers=encoder_num_layers, bidirectional=True)
	            decoder = Decoder(output_dim, embed_dim,
	                              enc_hidden_dim, dec_hidden_dim,
	                              num_layers=decoder_num_layers)
	            model = Seq2Seq(encoder, decoder, self.device).to(self.device)

	            # Load weights.
	            # SECURITY: torch.load unpickles the file, so only load
	            # checkpoints from trusted sources.
	            checkpoint = torch.load(model_path, map_location=self.device)
	            model.load_state_dict(checkpoint)
	            model.eval()
	        except Exception as e:
	            print(f"Error loading model: {e}")
	            self.model = None
	            return

	        # Publish the model only once it is fully loaded, and remember where
	        # it came from so model_path does not go stale.
	        self.model = model
	        self.model_path = model_path
	        print(f"Model loaded from {model_path}")

	    def transcribe_inkml(self, inkml_path: str) -> Tuple[str, str]:
	        """
	        Transcribe an InkML file to LaTeX.

	        NOTE: the prediction is currently the literal ``\\placeholder``
	        string (optionally passed through the corrector); the loaded model
	        is not run yet.

	        Args:
	            inkml_path: Path to InkML file

	        Returns:
	            Tuple of (predicted_latex, ground_truth_latex if available).
	            ("", "") is returned when reading the file fails.

	        Raises:
	            ValueError: If no model is loaded.
	            ImportError: If the InkML reader could not be imported.
	        """
	        if self.model is None:
	            raise ValueError("Model not loaded. Please load a model first.")

	        if read_inkml_file is None:
	            raise ImportError("InkML reading functionality not available")

	        try:
	            # Read InkML file; the strokes are not consumed until real
	            # feature extraction is implemented.
	            _strokes, ground_truth = read_inkml_file(inkml_path)

	            # Convert to model input format
	            # This is a simplified version - actual implementation would need
	            # proper feature extraction and tensor conversion
	            # For now, return placeholder
	            predicted_latex = "\\placeholder"

	            # Apply corrector if enabled; a corrector failure is reported
	            # and the uncorrected prediction is kept.
	            if self.use_corrector and correct_latex:
	                try:
	                    predicted_latex = correct_latex(predicted_latex)
	                except Exception as e:
	                    print(f"Corrector error: {e}")

	            return predicted_latex, ground_truth
	        except Exception as e:
	            print(f"Error transcribing InkML: {e}")
	            return "", ""

	    def transcribe_image(self, image_path: str) -> str:
	        """
	        Transcribe a handwritten math image to LaTeX.

	        Note: This is a placeholder - actual implementation would require
	        image preprocessing and conversion to InkML or direct image
	        processing. ``image_path`` is currently not read.

	        Args:
	            image_path: Path to image file

	        Returns:
	            Predicted LaTeX string (currently always ``\\placeholder``)
	        """
	        # This would require additional image processing
	        # For now, return placeholder
	        return "\\placeholder"

	    def is_model_loaded(self) -> bool:
	        """
	        Check if model is loaded.

	        Returns:
	            True if model is loaded, False otherwise
	        """
	        return self.model is not None