Spaces:

m93
/

sentiment.api

Sleeping

App Files Files Community

m93 commited on Mar 20

Commit

986654d

verified ·

1 Parent(s): 12e8a63

Create app.py

Browse files

Files changed (1) hide show

app.py +147 -0

app.py ADDED Viewed

	@@ -0,0 +1,147 @@

+# app.py - Deploy this to Hugging Face Spaces
+# Install: pip install fastapi uvicorn torch transformers huggingface_hub
+import json
+import os
+from pathlib import Path
+import torch
+import torch.nn as nn
+from fastapi import FastAPI, HTTPException
+from huggingface_hub import hf_hub_download
+from pydantic import BaseModel
+from transformers import AutoModel, AutoTokenizer
+app = FastAPI(title="Sentiment Analysis API")
+# Global variables for lazy loading
+model = None
+tokenizer = None
+device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
+# Model definition (must match training code)
+class SentimentClassifier(nn.Module):
+    def __init__(self):
+        super().__init__()
+        self.bert = AutoModel.from_pretrained("distilbert-base-uncased")
+        self.dropout = nn.Dropout(0.3)
+        self.classifier = nn.Linear(768, 2)
+    def forward(self, input_ids, attention_mask, **kwargs):
+        outputs = self.bert(input_ids=input_ids, attention_mask=attention_mask)
+        pooled = outputs.last_hidden_state[:, 0]
+        x = self.dropout(pooled)
+        return self.classifier(x)
+# Request/Response models
+class PredictionRequest(BaseModel):
+    text: str
+class PredictionResponse(BaseModel):
+    sentiment: str
+    confidence: float
+def load_model_from_hf(repo_id: str):
+    """Load model from Hugging Face on-demand"""
+    global model, tokenizer
+    if model is not None:
+        return  # Already loaded
+    print(f"📥 Loading model from {repo_id}...")
+    # Download model files
+    cache_dir = "./model_cache"
+    Path(cache_dir).mkdir(exist_ok=True)
+    model_path = hf_hub_download(
+        repo_id=repo_id, filename="model.pt", cache_dir=cache_dir
+    )
+    config_path = hf_hub_download(
+        repo_id=repo_id, filename="config.json", cache_dir=cache_dir
+    )
+    # Load tokenizer
+    tokenizer = AutoTokenizer.from_pretrained(repo_id, cache_dir=cache_dir)
+    # Load model
+    model = SentimentClassifier()
+    model.load_state_dict(torch.load(model_path, map_location=device))
+    model.to(device)
+    model.eval()
+    print(f"✅ Model loaded successfully on {device}")
+@app.on_event("startup")
+async def startup_event():
+    """Load model when server starts"""
+    # Read from environment variable or use default
+    REPO_ID = os.environ.get("MODEL_REPO_ID", "m93/sentiment-model")
+    load_model_from_hf(REPO_ID)
+@app.get("/")
+def root():
+    return {
+        "message": "Sentiment Analysis API",
+        "status": "running",
+        "endpoints": {
+            "/predict": "POST - Analyze sentiment of text",
+            "/health": "GET - Check if model is loaded",
+            "/docs": "GET - Interactive API documentation",
+        },
+    }
+@app.get("/health")
+def health_check():
+    return {
+        "status": "healthy",
+        "model_loaded": model is not None,
+        "device": str(device),
+    }
+@app.post("/predict", response_model=PredictionResponse)
+def predict(request: PredictionRequest):
+    if model is None or tokenizer is None:
+        raise HTTPException(status_code=503, detail="Model not loaded")
+    try:
+        # Tokenize input
+        inputs = tokenizer(
+            request.text,
+            return_tensors="pt",
+            padding=True,
+            truncation=True,
+            max_length=512,
+        )
+        inputs = {k: v.to(device) for k, v in inputs.items()}
+        # Get prediction
+        with torch.no_grad():
+            outputs = model(**inputs)
+            probs = torch.softmax(outputs, dim=1)
+            prediction = torch.argmax(probs, dim=1).item()
+            confidence = probs[0][prediction].item()
+        sentiment = "positive" if prediction == 1 else "negative"
+        return PredictionResponse(sentiment=sentiment, confidence=round(confidence, 4))
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))
+if __name__ == "__main__":
+    import uvicorn
+    port = int(os.environ.get("PORT", 7860))  # HF Spaces uses port 7860
+    print("🚀 Starting API server...")
+    uvicorn.run(app, host="0.0.0.0", port=port)