# sentiment-api / app.py
# Uploaded by Ivanet22 ("Upload 4 files", commit 8d96cd3, verified)
# app.py - Deploy this to Hugging Face Spaces
# Install: pip install fastapi uvicorn torch transformers huggingface_hub
import json
import os
from pathlib import Path
import torch
import torch.nn as nn
from fastapi import FastAPI, HTTPException
from huggingface_hub import hf_hub_download
from pydantic import BaseModel
from transformers import AutoModel, AutoTokenizer
app = FastAPI(title="Sentiment Analysis API")

# Globals populated lazily by load_model_from_hf(); both stay None until the
# first successful load (the /predict handler 503s while they are None).
model = None
tokenizer = None
# Prefer GPU when available; model weights and input tensors are moved here.
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
# Model definition (must match training code)
class SentimentClassifier(nn.Module):
    """DistilBERT encoder topped with dropout and a 2-way linear head.

    The architecture must stay in sync with the training script — otherwise
    the saved state_dict will not load.
    """

    def __init__(self):
        super().__init__()
        self.bert = AutoModel.from_pretrained("distilbert-base-uncased")
        self.dropout = nn.Dropout(0.3)
        self.classifier = nn.Linear(768, 2)

    def forward(self, input_ids, attention_mask, **kwargs):
        """Return raw logits of shape (batch, 2); extra kwargs are ignored."""
        encoded = self.bert(input_ids=input_ids, attention_mask=attention_mask)
        # The [CLS] position (index 0) stands in for the whole sequence.
        cls_embedding = encoded.last_hidden_state[:, 0]
        return self.classifier(self.dropout(cls_embedding))
# Request/Response models
class PredictionRequest(BaseModel):
    """Body schema for POST /predict."""

    # Raw text to classify; the tokenizer truncates it to 512 tokens downstream.
    text: str
class PredictionResponse(BaseModel):
    """Response schema for POST /predict."""

    # "positive" or "negative" (classifier head index 1 == positive).
    sentiment: str
    # Softmax probability of the chosen class, rounded to 4 decimal places.
    confidence: float
def load_model_from_hf(repo_id: str) -> None:
    """Download the fine-tuned classifier from the Hugging Face Hub and
    initialize the module-level `model` and `tokenizer` singletons.

    Safe to call repeatedly: it returns immediately once both globals are
    populated. `model` is only assigned after a fully successful load, so a
    failed attempt leaves the service in the "not loaded" state and can be
    retried.

    Args:
        repo_id: Hub repository id, e.g. "Ivanet22/sentiment-model".
    """
    global model, tokenizer
    # Guard BOTH globals so a partial earlier failure is retried.
    if model is not None and tokenizer is not None:
        return  # Already loaded
    print(f"📥 Loading model from {repo_id}...")

    cache_dir = "./model_cache"
    Path(cache_dir).mkdir(exist_ok=True)

    # Only the checkpoint is needed; the previous config.json download was
    # never read anywhere, so it has been dropped.
    model_path = hf_hub_download(
        repo_id=repo_id, filename="model.pt", cache_dir=cache_dir
    )

    # Tokenizer comes straight from the Hub repo.
    tokenizer = AutoTokenizer.from_pretrained(repo_id, cache_dir=cache_dir)

    # weights_only=True: the file is a plain state_dict, so refuse to
    # unpickle arbitrary objects from a remotely-hosted checkpoint.
    classifier = SentimentClassifier()
    classifier.load_state_dict(
        torch.load(model_path, map_location=device, weights_only=True)
    )
    classifier.to(device)
    classifier.eval()
    model = classifier
    print(f"✅ Model loaded successfully on {device}")
@app.on_event("startup")
async def startup_event():
    """Fetch and initialize the model as soon as the server boots."""
    # Repo id is configurable via environment; falls back to the default repo.
    repo = os.environ.get("MODEL_REPO_ID", "Ivanet22/sentiment-model")
    load_model_from_hf(repo)
@app.get("/")
def root():
    """Landing endpoint: a short, human-readable map of the API."""
    endpoints = {
        "/predict": "POST - Analyze sentiment of text",
        "/health": "GET - Check if model is loaded",
        "/docs": "GET - Interactive API documentation",
    }
    return {
        "message": "Sentiment Analysis API",
        "status": "running",
        "endpoints": endpoints,
    }
@app.get("/health")
def health_check():
    """Report service liveness, model-load state, and the inference device."""
    return dict(
        status="healthy",
        model_loaded=model is not None,
        device=str(device),
    )
@app.post("/predict", response_model=PredictionResponse)
def predict(request: PredictionRequest):
    """Classify the sentiment of `request.text`.

    Returns:
        PredictionResponse with sentiment ("positive"/"negative") and the
        softmax confidence of the chosen class, rounded to 4 decimals.

    Raises:
        HTTPException: 503 if the model has not finished loading;
            500 for any failure during tokenization or inference.
    """
    if model is None or tokenizer is None:
        raise HTTPException(status_code=503, detail="Model not loaded")
    try:
        # Tokenize; truncate to the encoder's 512-token context window.
        inputs = tokenizer(
            request.text,
            return_tensors="pt",
            padding=True,
            truncation=True,
            max_length=512,
        )
        inputs = {k: v.to(device) for k, v in inputs.items()}

        with torch.no_grad():  # inference only — skip autograd bookkeeping
            logits = model(**inputs)
            probs = torch.softmax(logits, dim=1)
            prediction = torch.argmax(probs, dim=1).item()
            confidence = probs[0, prediction].item()

        # Label convention from training: index 1 == positive.
        sentiment = "positive" if prediction == 1 else "negative"
        return PredictionResponse(sentiment=sentiment, confidence=round(confidence, 4))
    except Exception as e:
        # Chain the cause so server logs keep the original traceback.
        raise HTTPException(status_code=500, detail=str(e)) from e
if __name__ == "__main__":
    import uvicorn

    # HF Spaces routes traffic to port 7860 by default.
    serve_port = int(os.environ.get("PORT", 7860))
    print("🚀 Starting API server...")
    uvicorn.run(app, host="0.0.0.0", port=serve_port)