Spaces:

karim323
/

nlp-analysis-api

Running

karim323 commited on Nov 13, 2025

Commit

b82bbd8

1 Parent(s): 936e189

Fix HF Spaces deployment: use port 7860, async model loading, immediate health checks

Files changed (3) hide show

Dockerfile CHANGED Viewed

@@ -19,9 +19,9 @@ RUN pip install --no-cache-dir --upgrade pip && \
 # Copy application code
 COPY . .
-# Expose port (Railway will override with $PORT)
-EXPOSE 8000
 # Run the application
-CMD ["python", "-m", "uvicorn", "main:app", "--host", "0.0.0.0", "--port", "8000"]

 # Copy application code
 COPY . .
+# Expose port (Hugging Face Spaces uses 7860)
+EXPOSE 7860
 # Run the application
+CMD ["python", "-m", "uvicorn", "main:app", "--host", "0.0.0.0", "--port", "7860"]

lib/routes.py CHANGED Viewed

@@ -59,16 +59,33 @@ async def root(request: Request):
 @limiter.limit("30/minute")
 async def health_check(request: Request):
     """Detailed health check endpoint with model status"""
-    from main import sentiment_model, ner_model, paraphrase_model, summarization_model
-    return {
-        "status": "healthy",
-        "models": {
-            "sentiment": sentiment_model.is_loaded() if sentiment_model else False,
-            "ner": ner_model.is_loaded() if ner_model else False,
-            "paraphrase": paraphrase_model.is_loaded() if paraphrase_model else False,
-            "summarization": summarization_model.is_loaded() if summarization_model else False
         }
-    }
 # Sentiment analysis endpoints

 @limiter.limit("30/minute")
 async def health_check(request: Request):
     """Detailed health check endpoint with model status"""
+    # Always return healthy - models load in background
+    # This allows HF Spaces health checks to pass immediately
+    try:
+        from main import sentiment_model, ner_model, paraphrase_model, summarization_model
+        return {
+            "status": "healthy",
+            "message": "API is running. Models may still be loading.",
+            "models": {
+                "sentiment": sentiment_model.is_loaded() if sentiment_model else False,
+                "ner": ner_model.is_loaded() if ner_model else False,
+                "paraphrase": paraphrase_model.is_loaded() if paraphrase_model else False,
+                "summarization": summarization_model.is_loaded() if summarization_model else False
+            }
+        }
+    except Exception:
+        # Even if models aren't initialized yet, return healthy
+        # This ensures HF Spaces health checks pass
+        return {
+            "status": "healthy",
+            "message": "API is starting. Models loading in background.",
+            "models": {
+                "sentiment": False,
+                "ner": False,
+                "paraphrase": False,
+                "summarization": False
+            }
         }
 # Sentiment analysis endpoints

main.py CHANGED Viewed

@@ -30,8 +30,12 @@ logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
 # Get configuration from environment variables
-ALLOWED_ORIGINS = os.getenv("ALLOWED_ORIGINS", "http://localhost:8000").split(",")
-ENVIRONMENT = os.getenv("ENVIRONMENT", "development")
 logger.info(f"Starting application in {ENVIRONMENT} mode")
 logger.info(f"Allowed CORS origins: {ALLOWED_ORIGINS}")
@@ -110,10 +114,12 @@ def load_models():
     logger.info("Core models loaded successfully!")
-# Load models on startup
 @app.on_event("startup")
 async def startup_event():
-    load_models()
 # Include router

 logger = logging.getLogger(__name__)
 # Get configuration from environment variables
+# For Hugging Face Spaces, allow all origins by default
+default_origins = "*" if os.getenv("HF_SPACE_ID") else "http://localhost:8000"
+ALLOWED_ORIGINS = os.getenv("ALLOWED_ORIGINS", default_origins)
+if ALLOWED_ORIGINS != "*":
+    ALLOWED_ORIGINS = ALLOWED_ORIGINS.split(",")
+ENVIRONMENT = os.getenv("ENVIRONMENT", "production" if os.getenv("HF_SPACE_ID") else "development")
 logger.info(f"Starting application in {ENVIRONMENT} mode")
 logger.info(f"Allowed CORS origins: {ALLOWED_ORIGINS}")
     logger.info("Core models loaded successfully!")
+# Load models on startup (non-blocking for HF Spaces health checks)
 @app.on_event("startup")
 async def startup_event():
+    # Load models in background to allow health checks to respond quickly
+    import asyncio
+    asyncio.create_task(asyncio.to_thread(load_models))
 # Include router