MdSourav76046 committed on
Commit
5aa4532
·
verified ·
1 Parent(s): 06b80ad

Delete app.py

Browse files
Files changed (1) hide show
  1. app.py +0 -176
app.py DELETED
@@ -1,176 +0,0 @@
1
- """
2
- FastAPI Server for Text Correction
3
- Deploy this to run your text correction model as an API
4
- """
5
-
6
- from fastapi import FastAPI, HTTPException
7
- from fastapi.middleware.cors import CORSMiddleware
8
- from pydantic import BaseModel
9
- from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
10
- import torch
11
- import os
12
- from typing import Optional
13
-
14
- # Initialize FastAPI app
15
# FastAPI application instance exposing the text-correction endpoints.
app = FastAPI(
    title="Text Correction API",
    description="API for correcting OCR text using trained model",
    version="1.0.0"
)

# Allow cross-origin requests so the iOS client can call this API directly.
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],  # In production, specify your iOS app's domain
    allow_credentials=True,
    allow_methods=["*"],
    allow_headers=["*"],
)
29
-
30
- # Global variables for model
31
# Module-level model state; populated once by the startup hook.
model = None      # seq2seq model instance after loading, else None
tokenizer = None  # tokenizer paired with the model, else None
device = None     # "cuda" or "cpu" once chosen at startup, else None
34
-
35
- # Pydantic models for request/response
36
class TextRequest(BaseModel):
    """Request body for /correct: the raw OCR text to be corrected."""
    text: str
38
-
39
class TextResponse(BaseModel):
    """Response body for /correct."""
    corrected_text: str    # decoded model output, special tokens stripped
    processing_time: float  # seconds spent correcting, rounded to 2 decimals
42
-
43
class HealthResponse(BaseModel):
    """Response body for /health."""
    status: str        # "healthy" when the model is loaded, else "unhealthy"
    model_loaded: bool  # whether the global model is available
    device: str        # device in use, or "unknown" before startup completes
47
-
48
- # Load model at startup
49
@app.on_event("startup")
async def load_model():
    """Load the seq2seq model and tokenizer into module globals at startup.

    Reads the model directory from the MODEL_PATH environment variable
    (default "./gpu_base_model2"), picks CUDA when available, and puts the
    model in eval mode. On failure it only logs — the API stays up but
    /correct will answer 503 until a restart succeeds.
    """
    global model, tokenizer, device

    print("🚀 Starting Text Correction API...")

    # Prefer the GPU when one is visible to torch.
    if torch.cuda.is_available():
        device = "cuda"
    else:
        device = "cpu"
    print(f"📱 Using device: {device}")

    try:
        path = os.environ.get("MODEL_PATH", "./gpu_base_model2")
        print(f"📦 Loading model from: {path}")

        model = AutoModelForSeq2SeqLM.from_pretrained(path)
        tokenizer = AutoTokenizer.from_pretrained(path)

        # Move to the chosen device and disable dropout for inference.
        model.to(device)
        model.eval()

        print("✅ Model loaded successfully!")
        print(f" - Model type: {type(model).__name__}")
        print(f" - Vocabulary size: {tokenizer.vocab_size}")
        print(f" - Device: {device}")

    except Exception as exc:
        # Deliberate best-effort: keep serving so /health can report the state.
        print(f"❌ Error loading model: {exc}")
        print("⚠️ API will not work until model is loaded")
79
-
80
- # Health check endpoint
81
@app.get("/health", response_model=HealthResponse)
async def health_check():
    """Check if the API and model are ready"""
    loaded = model is not None
    return HealthResponse(
        status="healthy" if loaded else "unhealthy",
        model_loaded=loaded,
        device=device or "unknown",
    )
89
-
90
- # Text correction endpoint
91
@app.post("/correct", response_model=TextResponse)
async def correct_text(request: TextRequest):
    """
    Correct text using the trained model

    Args:
        request: TextRequest containing the text to correct

    Returns:
        TextResponse with corrected text and processing time

    Raises:
        HTTPException: 503 if the model is not loaded, 400 on empty input,
            500 if tokenization/generation fails.
    """
    import time

    # Fail fast while the startup hook has not (or could not) load the model.
    if model is None or tokenizer is None:
        raise HTTPException(
            status_code=503,
            detail="Model not loaded. Please wait for the model to initialize."
        )

    if not request.text or not request.text.strip():
        raise HTTPException(
            status_code=400,
            detail="Text cannot be empty"
        )

    # Use the monotonic perf_counter for elapsed time: time.time() is
    # wall-clock and can jump (NTP/DST adjustments), yielding wrong or
    # even negative durations.
    start_time = time.perf_counter()

    try:
        # Tokenize input text (truncated to the model's 512-token window).
        inputs = tokenizer(
            request.text,
            return_tensors="pt",
            max_length=512,
            truncation=True,
            padding=True
        ).to(device)

        # Generate corrected text with beam search.
        # NOTE(review): this synchronous generate() call blocks the event
        # loop for the whole request — consider run_in_executor if the
        # server must stay responsive under load; confirm before changing.
        with torch.no_grad():
            outputs = model.generate(
                inputs.input_ids,
                attention_mask=inputs.attention_mask,
                max_length=512,
                num_beams=5,
                early_stopping=True,
                pad_token_id=tokenizer.pad_token_id,
                eos_token_id=tokenizer.eos_token_id
            )

        # Decode the best beam, dropping pad/eos/special tokens.
        corrected_text = tokenizer.decode(outputs[0], skip_special_tokens=True)

        processing_time = time.perf_counter() - start_time

        print(f"✅ Text corrected in {processing_time:.2f}s")
        print(f" Input: {request.text[:50]}...")
        print(f" Output: {corrected_text[:50]}...")

        return TextResponse(
            corrected_text=corrected_text,
            processing_time=round(processing_time, 2)
        )

    except Exception as e:
        print(f"❌ Error during correction: {e}")
        raise HTTPException(
            status_code=500,
            detail=f"Text correction failed: {str(e)}"
        )
160
-
161
- # Root endpoint
162
@app.get("/")
async def root():
    """Describe the API and list its available endpoints."""
    endpoints = {
        "health": "/health",
        "correct": "/correct (POST)",
    }
    return {
        "message": "Text Correction API",
        "version": "1.0.0",
        "endpoints": endpoints,
    }
172
-
173
# Allow running directly (`python app.py`): serve on all interfaces, port 8000.
if __name__ == "__main__":
    import uvicorn

    uvicorn.run(app, host="0.0.0.0", port=8000)
176
-