Binary_classifier / classifier_api.py

Upload 5 files

88b8fd6 verified 7 months ago

5.2 kB

	from fastapi import FastAPI, HTTPException
	from pydantic import BaseModel, Field
	from typing import List, Dict, Optional
	import logging
	from pathlib import Path
	import sys
	import os
	from huggingface_hub import snapshot_download

	# Make modules that live next to this file importable: Path(__file__).parent
	# is the directory containing this file, and it is appended to sys.path so
	# the `binary_classifier` import below resolves.
	sys.path.append(str(Path(__file__).parent))

	from binary_classifier import CBTBinaryClassifier

	# Configure logging: root logger at INFO, plus a logger named after this
	# module that the startup hook and the endpoints below write to.
	logging.basicConfig(level=logging.INFO)
	logger = logging.getLogger(__name__)

	# Create the FastAPI application object; the route decorators and the
	# startup hook further down register themselves on it.
	app = FastAPI(
	title="CBT Binary Classifier API",
	description="API for detecting CBT-triggering conversations",
	version="1.0.0"
	)

	# Request/Response models
	class TextRequest(BaseModel):
	    # Request body for classifying one text (used by POST /classify).
	    # Documented with comments rather than a docstring so the generated
	    # schema for this model is left exactly as it was.

	    # The text to run through the classifier (required).
	    text: str = Field(
	        ...,
	        description="Text to classify",
	    )

	    # Threshold passed to the classifier together with the text;
	    # defaults to 0.7 when the client omits it.
	    threshold: float = Field(
	        0.7,
	        description="Confidence threshold for CBT trigger detection",
	    )

	class BatchTextRequest(BaseModel):
	    # Request body for classifying several texts in one call
	    # (used by POST /classify/batch). Documented with comments rather
	    # than a docstring so the generated schema is left exactly as it was.

	    # The texts to classify (required).
	    texts: List[str] = Field(
	        ...,
	        description="List of texts to classify",
	    )

	    # One threshold shared by every text in the batch; defaults to 0.7.
	    threshold: float = Field(
	        0.7,
	        description="Confidence threshold for CBT trigger detection",
	    )

	class PredictionResponse(BaseModel):
	    # Result for a single classified text. Documented with comments
	    # rather than a docstring so the generated schema is unchanged.

	    # Verdict and score; the endpoints in this file copy them from the
	    # classifier's result dict under the same key names.
	    is_cbt_trigger: bool
	    confidence: float

	    # Threshold reported back alongside the verdict.
	    threshold: float

	    # Optional echo of the input; the endpoints in this file fill it with
	    # the text cut to 100 characters plus "..." when it is longer.
	    text: Optional[str] = None

	class BatchPredictionResponse(BaseModel):
	    # Response body of POST /classify/batch. Documented with a comment
	    # rather than a docstring so the generated schema is unchanged.

	    # One PredictionResponse per classified text.
	    predictions: List[PredictionResponse]

	# Initialize classifier
	# Module-level handle to the model. It stays None until the startup hook
	# has finished loading, which is what the endpoints check to report
	# "Model not loaded".
	classifier: Optional[CBTBinaryClassifier] = None


	@app.on_event("startup")
	async def startup_event():
	    """Load the model on startup.

	    The model source is selected through environment variables:

	    * ``USE_LOCAL_MODEL``: when it equals "true" (case-insensitive) and
	      the ``cbt_classifier`` directory next to this file exists, the
	      model is loaded from that directory.
	    * ``HF_MODEL_ID``: in every other case this repository (default
	      "SaitejaJate/Binary_classifier") is downloaded from the Hugging
	      Face Hub into ``model_cache/downloaded_model`` next to this file
	      and loaded from there.

	    Raises:
	        Exception: any error raised while constructing, downloading or
	            loading the model is logged with its traceback and re-raised.
	    """
	    global classifier

	    base_dir = Path(__file__).parent
	    hf_model_id = os.getenv("HF_MODEL_ID", "SaitejaJate/Binary_classifier")
	    local_model_path = base_dir / "cbt_classifier"

	    # Check if we should use local model or download from HF
	    use_local = os.getenv("USE_LOCAL_MODEL", "false").lower() == "true"

	    try:
	        # Build into a local name first: the global is only published once
	        # loading succeeded, so a failed load never leaves a non-None but
	        # unusable classifier behind.
	        model = CBTBinaryClassifier()

	        if use_local and local_model_path.exists():
	            model.load_model(str(local_model_path))
	            logger.info(f"Model loaded successfully from local path: {local_model_path}")
	        else:
	            if use_local:
	                # The local model was requested but is missing; make the
	                # fallback to the Hub visible instead of silent.
	                logger.warning(
	                    "USE_LOCAL_MODEL is set but %s does not exist; "
	                    "falling back to Hugging Face Hub",
	                    local_model_path,
	                )

	            logger.info(f"Downloading model from Hugging Face Hub: {hf_model_id}")
	            cache_dir = base_dir / "model_cache"

	            # Download model files
	            model_path = snapshot_download(
	                repo_id=hf_model_id,
	                cache_dir=str(cache_dir),
	                local_dir=str(cache_dir / "downloaded_model"),
	            )

	            model.load_model(model_path)
	            logger.info("Model loaded successfully from Hugging Face Hub")
	    except Exception as e:
	        # logger.exception keeps the traceback, which logger.error dropped.
	        logger.exception("Failed to load model: %s", e)
	        raise

	    classifier = model

	@app.get("/")
	async def root():
	    """Health check endpoint"""
	    # The docstring above is kept verbatim: FastAPI publishes endpoint
	    # docstrings as the operation description in the generated API docs.
	    #
	    # Always answers with a fixed status/service pair plus a flag telling
	    # whether the module-level classifier has been set.
	    model_ready = classifier is not None
	    payload = {
	        "status": "active",
	        "service": "CBT Binary Classifier API",
	        "model_loaded": model_ready,
	    }
	    return payload

	@app.post("/classify", response_model=PredictionResponse)
	async def classify_text(request: TextRequest):
	    """Classify a single text"""
	    # The docstring above is kept verbatim: FastAPI publishes endpoint
	    # docstrings as the operation description in the generated API docs.
	    #
	    # Parameters: request -- the text and threshold sent by the client.
	    # Returns: a PredictionResponse built from the classifier's result
	    #   dict, with the input echoed back cut to 100 characters plus "..."
	    #   when it is longer.
	    # Raises: HTTPException 503 when no model is loaded; HTTPException 500
	    #   (detail = the error text) when classification itself fails.

	    # This guard sits outside the try block on purpose: inside it, the 503
	    # was caught by the generic handler below and sent out as a 500.
	    if classifier is None:
	        raise HTTPException(status_code=503, detail="Model not loaded")

	    try:
	        result = classifier.predict(request.text, request.threshold)

	        text = request.text
	        preview = text[:100] + "..." if len(text) > 100 else text

	        return PredictionResponse(
	            is_cbt_trigger=result['is_cbt_trigger'],
	            confidence=result['confidence'],
	            threshold=result['threshold'],
	            text=preview,
	        )
	    except Exception as e:
	        # Keep the traceback in the log and chain the original error.
	        logger.exception("Classification error: %s", e)
	        raise HTTPException(status_code=500, detail=str(e)) from e

	@app.post("/classify/batch", response_model=BatchPredictionResponse)
	async def classify_batch(request: BatchTextRequest):
	    """Classify multiple texts"""
	    # The docstring above is kept verbatim: FastAPI publishes endpoint
	    # docstrings as the operation description in the generated API docs.
	    #
	    # Parameters: request -- the texts and the shared threshold.
	    # Returns: a BatchPredictionResponse holding one PredictionResponse
	    #   per (text, result) pair, each text echoed back cut to 100
	    #   characters plus "..." when it is longer.
	    # Raises: HTTPException 503 when no model is loaded; HTTPException 500
	    #   (detail = the error text) when classification itself fails.

	    # This guard sits outside the try block on purpose: inside it, the 503
	    # was caught by the generic handler below and sent out as a 500.
	    if classifier is None:
	        raise HTTPException(status_code=503, detail="Model not loaded")

	    try:
	        results = classifier.batch_predict(request.texts, request.threshold)

	        # Assumes batch_predict returns one result per input text, in input
	        # order -- TODO confirm against CBTBinaryClassifier.
	        predictions = [
	            PredictionResponse(
	                is_cbt_trigger=result['is_cbt_trigger'],
	                confidence=result['confidence'],
	                threshold=result['threshold'],
	                text=text[:100] + "..." if len(text) > 100 else text,
	            )
	            for text, result in zip(request.texts, results)
	        ]

	        return BatchPredictionResponse(predictions=predictions)
	    except Exception as e:
	        # Keep the traceback in the log and chain the original error.
	        logger.exception("Batch classification error: %s", e)
	        raise HTTPException(status_code=500, detail=str(e)) from e

	@app.get("/model/info")
	async def model_info():
	    """Get information about the loaded model"""
	    # The docstring above is kept verbatim: FastAPI publishes endpoint
	    # docstrings as the operation description in the generated API docs.
	    #
	    # Raises HTTPException 503 while no model is loaded.
	    model = classifier
	    if model is None:
	        raise HTTPException(status_code=503, detail="Model not loaded")

	    # NOTE(review): the reported path is always the "cbt_classifier"
	    # directory next to this file; it is not derived from the location the
	    # model was actually loaded from -- confirm this is intended.
	    local_dir = Path(__file__).parent / "cbt_classifier"

	    info = {
	        "model_name": model.model_name,
	        "model_path": str(local_dir),
	        "status": "loaded",
	    }
	    return info

	if __name__ == "__main__":
	    # Script entry point: serve the app with uvicorn. uvicorn is imported
	    # here so that merely importing this module does not require it.
	    import uvicorn

	    uvicorn.run(
	        app,
	        host="0.0.0.0",
	        port=8001,
	    )