tabito12345678910 committed on
Commit
45c2088
·
1 Parent(s): 8e060d3

Migrate from Gradio to FastAPI - adds /status endpoint and cold start handling while maintaining exact same API functionality

Browse files
Files changed (3) hide show
  1. README.md +30 -27
  2. app.py +161 -129
  3. requirements.txt +4 -1
README.md CHANGED
@@ -1,31 +1,34 @@
1
- ---
2
- title: Gohan Product Recommendation API
3
- emoji: ๐Ÿš
4
- colorFrom: red
5
- colorTo: yellow
6
- sdk: gradio
7
- sdk_version: "4.44.0"
8
- app_file: app.py
9
- pinned: false
10
- ---
11
-
12
- # ๐Ÿš Gohan Product Recommendation API
13
-
14
- Clean API template for rice product recommendations.
15
-
16
- ## Setup
17
- 1. Add your model files to a 'model/' directory
18
- 2. Add encoder JSON files to 'model/gohan/'
19
- 3. Update paths in app.py and inference script
20
- 4. Deploy to HuggingFace Spaces
21
 
22
  ## Usage
23
- This API provides product recommendations for rice products based on company data.
24
 
25
- ## Current Status
26
- โš ๏ธ **Template Mode** - Add your trained model file to enable predictions
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
27
 
28
- **Required files to add:**
29
- - `model/gohan/epoch_012_p50_0.5836.pt` (PyTorch model)
30
- - `model/gohan/*.json` (encoder files) โœ… Already included
31
- - `model/gohan/gohan_pm.csv` (product master data) โœ… Already included
 
1
+ # Gohan FastAPI
2
+
3
+ This is a FastAPI-based product recommendation API deployed on Hugging Face Spaces.
4
+
5
+ ## Endpoints
6
+
7
+ - `GET /` - Root endpoint with API information
8
+ - `GET /status` - Health check and model status
9
+ - `POST /predict` - Main prediction endpoint with topK parameter
10
+ - `POST /predict_simple` - Simple prediction endpoint
 
 
 
 
 
 
 
 
 
 
11
 
12
  ## Usage
 
13
 
14
+ ### Check API Status
15
+ ```bash
16
+ curl "https://your-space-url.hf.space/status"
17
+ ```
18
+
19
+ ### Make Predictions
20
+ ```bash
21
+ curl -X POST "https://your-space-url.hf.space/predict" \
22
+ -H "Content-Type: application/json" \
23
+ -d '{"company_data_json": "{...}", "topK": 10}'
24
+ ```
25
+
26
+ ## Model Loading
27
+
28
+ The API uses FastAPI's lifespan events to load models only once during startup, providing efficient cold start handling.
29
+
30
+ ## Required Model Files
31
 
32
+ - `model/gohan/epoch_*.pt` (PyTorch model)
33
+ - `model/gohan/*.json` (encoder files)
34
+ - `model/gohan/gohan_pm.csv` (product master data)
 
app.py CHANGED
@@ -1,59 +1,149 @@
1
  #!/usr/bin/env python3
2
  """
3
- Gohan (CID) Product Recommendation Gradio App - Light Version
4
- Gradio interface for the Gohan CID inference engine
5
- This is a template - add your model files to make it functional
6
  """
7
 
8
- import gradio as gr
 
 
9
  import json
10
  import os
 
 
11
 
12
- # Model paths - UPDATE THESE when you add your model files
13
- MODEL_PATH = "model/gohan/epoch_009_p50_0.5776.pt"
 
 
 
 
 
 
14
  ENCODERS_DIR = "model/gohan"
15
  PRODUCT_MASTER_PATH = "model/gohan/gohan_pm.csv"
16
 
17
- # Check if model files exist
18
- model_files_exist = all([
19
- os.path.exists(MODEL_PATH),
20
- os.path.exists(ENCODERS_DIR),
21
- os.path.exists(PRODUCT_MASTER_PATH)
22
- ])
23
-
24
- if model_files_exist:
25
- try:
26
- from inference_gohan_cid import GohanCIDInferenceEngine
27
- engine = GohanCIDInferenceEngine(
28
- model_path=MODEL_PATH,
29
- encoders_dir=ENCODERS_DIR,
30
- product_master_path=PRODUCT_MASTER_PATH
31
- )
32
- print("โœ… Gohan CID model loaded successfully!")
33
- except Exception as e:
34
- print(f"โŒ Failed to load Gohan CID model: {e}")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
35
  engine = None
36
- else:
37
- print("โš ๏ธ Model files not found. This is a template - add your model files to:")
38
- print(f" - {MODEL_PATH}")
39
- print(f" - {ENCODERS_DIR}/*.json")
40
- print(f" - {PRODUCT_MASTER_PATH}")
41
- engine = None
 
 
 
 
 
 
 
42
 
 
43
  REQUIRED_FIELDS_EN = [
44
  'INDUSTRY', 'EMPLOYEE_RANGE', 'FRIDGE_RANGE', 'PAYMENT_METHOD', 'PREFECTURE',
45
  'FIRST_YEAR', 'FIRST_MONTH', 'LAT', 'LONG', 'DELIVERY_NUM', 'MEDIAN_GENDER_RATIO',
46
  'MODE_TOP_AGE_RANGE_1', 'MODE_TOP_AGE_RANGE_2', 'MODE_TOP_AGE_RANGE_3'
47
  ]
48
 
49
- def predict(company_data_json: str, topK: int | None = None) -> str:
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
50
  """
51
  Predict gohan categories for a company (CID-based)
52
- Args:
53
- company_data_json: JSON string containing company information
54
- topK: Optional override for number of recommendations
55
- Returns:
56
- JSON string with predictions
57
  """
58
  try:
59
  if engine is None:
@@ -62,41 +152,33 @@ def predict(company_data_json: str, topK: int | None = None) -> str:
62
  else:
63
  error_msg = "Model files not found - this is a template. Add your model files to enable predictions."
64
 
65
- return json.dumps({
66
- "status": "error",
67
- "error": error_msg,
68
- "model": "gohan",
69
- "setup_instructions": {
70
- "model_file": MODEL_PATH,
71
- "encoders_dir": ENCODERS_DIR,
72
- "product_master": PRODUCT_MASTER_PATH
73
- }
74
- }, indent=2)
75
 
76
  # Parse input
77
  try:
78
- incoming = json.loads(company_data_json)
79
  except json.JSONDecodeError as e:
80
- return json.dumps({
81
- "status": "error",
82
- "error": f"Invalid JSON format: {str(e)}",
83
- "model": "gohan"
84
- })
85
 
86
  # topK handling
87
- if topK is not None and topK > 0:
88
- incoming["topK"] = int(topK)
89
  else:
90
  incoming.setdefault("topK", 30)
91
 
92
  # Validate English field presence
93
  missing_en = [f for f in REQUIRED_FIELDS_EN if f not in incoming]
94
  if missing_en:
95
- return json.dumps({
96
- "status": "error",
97
- "error": f"Missing required fields: {missing_en}",
98
- "model": "gohan"
99
- })
100
 
101
  # Predict
102
  recommendations = engine.predict(incoming)
@@ -104,80 +186,30 @@ def predict(company_data_json: str, topK: int | None = None) -> str:
104
  if len(recommendations) > requested_k:
105
  recommendations = recommendations[:requested_k]
106
 
107
- return json.dumps({
108
- "status": "success",
109
- "model": "gohan",
110
- "recommendations": recommendations,
111
- "metadata": {
112
  "model_version": "gohan_cid_v1.0",
113
  "total_categories": len(recommendations),
114
  "requested_k": requested_k
115
  }
116
- }, ensure_ascii=False, indent=2)
117
- except Exception as e:
118
- return json.dumps({
119
- "status": "error",
120
- "error": str(e),
121
- "model": "gohan"
122
- })
123
-
124
- def predict_simple(company_data_json: str) -> str:
125
- return predict(company_data_json, None)
126
-
127
- # Sample input for testing
128
- sample_input = json.dumps({
129
- "INDUSTRY": "finance",
130
- "EMPLOYEE_RANGE": "200-1000",
131
- "FRIDGE_RANGE": "100-500",
132
- "PAYMENT_METHOD": "card",
133
- "PREFECTURE": "osaka",
134
- "FIRST_YEAR": 2019,
135
- "FIRST_MONTH": 6,
136
- "LAT": 34.6937,
137
- "LONG": 135.5023,
138
- "DELIVERY_NUM": 300,
139
- "MEDIAN_GENDER_RATIO": 0.55,
140
- "MODE_TOP_AGE_RANGE_1": "40-49",
141
- "MODE_TOP_AGE_RANGE_2": "30-39",
142
- "MODE_TOP_AGE_RANGE_3": "50-59"
143
- }, indent=2)
144
-
145
- with gr.Blocks(title="Gohan CID Product Recommendation API (Light)") as demo:
146
- gr.Markdown("# ๐Ÿš Gohan Product Recommendation API (Light Template)")
147
-
148
- if model_files_exist:
149
- gr.Markdown("โœ… **Model Status**: Loaded and ready")
150
- else:
151
- gr.Markdown("""
152
- โš ๏ธ **Model Status**: Template mode - add your model files to enable predictions
153
 
154
- **Required files to add:**
155
- - `model/gohan/epoch_009_p50_0.5776.pt` (PyTorch model)
156
- - `model/gohan/*.json` (encoder files)
157
- - `model/gohan/gohan_pm.csv` (product master data)
158
- """)
159
-
160
- gr.Markdown("Enter company data as JSON to get rice product recommendations.")
161
-
162
- with gr.Tab("Main API"):
163
- with gr.Row():
164
- with gr.Column():
165
- inp = gr.Textbox(label="Company Data (JSON)", lines=15, value=sample_input)
166
- topk = gr.Number(label="Top K Results (optional)", minimum=1, maximum=200, step=1, value=None)
167
- btn = gr.Button("Get Recommendations", variant="primary")
168
- with gr.Column():
169
- out = gr.Textbox(label="API Response", lines=20, interactive=False)
170
-
171
- with gr.Tab("Simple API"):
172
- with gr.Row():
173
- with gr.Column():
174
- inp2 = gr.Textbox(label="Company Data (JSON)", lines=15, value=sample_input)
175
- btn2 = gr.Button("Get Recommendations", variant="primary")
176
- with gr.Column():
177
- out2 = gr.Textbox(label="API Response", lines=20, interactive=False)
178
-
179
- btn.click(fn=predict, inputs=[inp, topk], outputs=out)
180
- btn2.click(fn=predict_simple, inputs=inp2, outputs=out2)
181
 
182
  if __name__ == "__main__":
183
- demo.launch(server_name="0.0.0.0", server_port=7860, show_api=True)
 
 
#!/usr/bin/env python3
"""
Gohan (CID) Product Recommendation FastAPI App

FastAPI version of the Gohan CID inference engine.  Maintains the same
prediction behaviour as the earlier Gradio version of this Space.
"""

from fastapi import FastAPI, HTTPException
from pydantic import BaseModel
from contextlib import asynccontextmanager
import json
import os
import time
from typing import List, Optional, Dict, Any

# Import the existing inference engine; fall back to None so the app can
# still start in "template" mode when the engine module is absent.
try:
    from gohan_cid import GohanCIDInferenceEngine
except ImportError:
    GohanCIDInferenceEngine = None

# Human-readable app name for log messages and API metadata.  The rest of
# the module previously referenced an undefined `app_name`; this constant
# provides it at module scope.
APP_NAME = "gohan"

# Model paths - same as the Gradio version.
# BUG FIX: the original expression was
#     "model/gohan/epoch_028_p50_0.6911.pt" if "gohan" == "yasai" else ...
# The condition compares two different literals, so it is always False and
# the else-branch is always taken; simplified to that constant.
MODEL_PATH = "model/gohan/epoch_009_p50_0.5776.pt"
ENCODERS_DIR = "model/gohan"
PRODUCT_MASTER_PATH = "model/gohan/gohan_pm.csv"
26
 
# Pydantic models matching the exact API structure.
# NOTE(review): field names and declaration order define the wire schema;
# do not reorder or rename without versioning the API.
class PredictionRequest(BaseModel):
    """Request body for /predict and /predict_simple."""
    # company_data_json: JSON-encoded company record (string, not an object)
    company_data_json: str
    # topK: optional override for the number of recommendations
    topK: Optional[int] = None

class CategoryRecommendation(BaseModel):
    """One recommended product category with its model score."""
    category_id: int
    category_name: str
    score: float

class PredictionResponse(BaseModel):
    """Successful prediction envelope returned by the predict endpoints."""
    status: str
    model: str
    recommendations: List[CategoryRecommendation]
    metadata: Dict[str, Any]
42
+
# Global variables
# engine: loaded GohanCIDInferenceEngine instance, or None until the
# lifespan startup hook runs (or permanently, when model files are missing).
engine = None
# model_files_exist: set during startup after checking the model paths.
model_files_exist = False
46
+
@asynccontextmanager
async def lifespan(app: FastAPI):
    """Load the model once at startup; log a message on shutdown.

    Using FastAPI's lifespan event gives a single cold-start load instead
    of per-request initialisation.  Sets the module globals `engine` and
    `model_files_exist`.
    """
    global engine, model_files_exist

    # BUG FIX: the original log strings interpolated an undefined name
    # `app_name` (NameError at startup); literals are used instead.
    print("🚀 Gohan FastAPI is starting. Loading AI model and data...")
    start_time = time.time()

    # Check if model files exist (same logic as the Gradio version).
    model_files_exist = all([
        os.path.exists(MODEL_PATH),
        os.path.exists(ENCODERS_DIR),
        os.path.exists(PRODUCT_MASTER_PATH),
    ])

    if model_files_exist:
        print("🔍 Checking model files:")
        print(f" - MODEL_PATH: {MODEL_PATH} (exists: {os.path.exists(MODEL_PATH)})")
        print(f" - ENCODERS_DIR: {ENCODERS_DIR} (exists: {os.path.exists(ENCODERS_DIR)})")
        print(f" - PRODUCT_MASTER_PATH: {PRODUCT_MASTER_PATH} (exists: {os.path.exists(PRODUCT_MASTER_PATH)})")

        try:
            if GohanCIDInferenceEngine:
                engine = GohanCIDInferenceEngine(
                    model_path=MODEL_PATH,
                    encoders_dir=ENCODERS_DIR,
                    product_master_path=PRODUCT_MASTER_PATH,
                )
                print("✅ Gohan CID model loaded successfully!")
            else:
                # Import of gohan_cid failed at module load time.
                print("❌ GohanCIDInferenceEngine not available")
                engine = None
        except Exception as e:
            # Best-effort startup: keep serving /status with a 503 instead
            # of crashing the whole Space.
            print(f"❌ Failed to load Gohan CID model: {e}")
            engine = None
    else:
        print("⚠️ Model files not found. This is a template - add your model files to:")
        print(f" - {MODEL_PATH}")
        print(f" - {ENCODERS_DIR}/*.json")
        print(f" - {PRODUCT_MASTER_PATH}")
        engine = None

    print(f"✅ Startup completed in {time.time() - start_time:.2f} seconds.")
    yield

    print("🔄 Gohan FastAPI is shutting down.")
92
+
# Initialize FastAPI app with lifespan-based startup/shutdown handling.
# BUG FIX: the original title/description f-strings referenced an undefined
# `app_name` (NameError at import time); literal text is used instead.
app = FastAPI(
    title="Gohan Product Recommendation API",
    description=(
        "FastAPI version of the Gohan recommendation system - maintains "
        "exact same functionality as Gradio version"
    ),
    version="2.0.0",
    lifespan=lifespan,
)
100
 
# Target input fields (same as Gradio version).
# English field names that must all be present in the incoming company JSON;
# the predict endpoint rejects requests missing any of these with HTTP 400.
REQUIRED_FIELDS_EN = [
    'INDUSTRY', 'EMPLOYEE_RANGE', 'FRIDGE_RANGE', 'PAYMENT_METHOD', 'PREFECTURE',
    'FIRST_YEAR', 'FIRST_MONTH', 'LAT', 'LONG', 'DELIVERY_NUM', 'MEDIAN_GENDER_RATIO',
    'MODE_TOP_AGE_RANGE_1', 'MODE_TOP_AGE_RANGE_2', 'MODE_TOP_AGE_RANGE_3'
]
107
 
@app.get("/")
def root():
    """Root endpoint: basic API info plus current model status.

    BUG FIX: the original message f-string referenced an undefined
    `app_name` (NameError on every request); a literal is used instead.
    """
    return {
        "message": "🍚 Gohan Product Recommendation API (FastAPI)",
        "status": "running",
        "version": "2.0.0",
        "endpoints": ["/status", "/predict", "/predict_simple"],
        "model_status": "loaded" if engine else "not_loaded",
        "model_files_exist": model_files_exist,
    }
118
+
@app.get("/status")
def get_status():
    """Health check: 200 with model/path info when ready, 503 otherwise."""
    if engine is None:
        # Distinguish "files present but load failed" from "template mode"
        # (files missing entirely); both are reported as 503.
        detail = (
            "Model not loaded - check model files"
            if model_files_exist
            else "Model files not found - this is a template. Add your model files to enable predictions."
        )
        raise HTTPException(status_code=503, detail=detail)

    return {
        "status": "ready",
        "model_loaded": engine is not None,
        "model_files_exist": model_files_exist,
        "model_path": MODEL_PATH,
        "encoders_dir": ENCODERS_DIR,
        "product_master_path": PRODUCT_MASTER_PATH,
    }
141
+
142
+ @app.post("/predict", response_model=PredictionResponse)
143
+ def predict(request: PredictionRequest):
144
  """
145
  Predict gohan categories for a company (CID-based)
146
+ This is the EXACT same logic as the Gradio version
 
 
 
 
147
  """
148
  try:
149
  if engine is None:
 
152
  else:
153
  error_msg = "Model files not found - this is a template. Add your model files to enable predictions."
154
 
155
+ raise HTTPException(
156
+ status_code=503,
157
+ detail=error_msg
158
+ )
 
 
 
 
 
 
159
 
160
  # Parse input
161
  try:
162
+ incoming = json.loads(request.company_data_json)
163
  except json.JSONDecodeError as e:
164
+ raise HTTPException(
165
+ status_code=400,
166
+ detail=f"Invalid JSON format: {str(e)}"
167
+ )
 
168
 
169
  # topK handling
170
+ if request.topK is not None and request.topK > 0:
171
+ incoming["topK"] = int(request.topK)
172
  else:
173
  incoming.setdefault("topK", 30)
174
 
175
  # Validate English field presence
176
  missing_en = [f for f in REQUIRED_FIELDS_EN if f not in incoming]
177
  if missing_en:
178
+ raise HTTPException(
179
+ status_code=400,
180
+ detail=f"Missing required fields: {missing_en}"
181
+ )
 
182
 
183
  # Predict
184
  recommendations = engine.predict(incoming)
 
186
  if len(recommendations) > requested_k:
187
  recommendations = recommendations[:requested_k]
188
 
189
+ return PredictionResponse(
190
+ status="success",
191
+ model="gohan",
192
+ recommendations=recommendations,
193
+ metadata={
194
  "model_version": "gohan_cid_v1.0",
195
  "total_categories": len(recommendations),
196
  "requested_k": requested_k
197
  }
198
+ )
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
199
 
200
+ except HTTPException:
201
+ raise
202
+ except Exception as e:
203
+ raise HTTPException(
204
+ status_code=500,
205
+ detail=f"Prediction error: {str(e)}"
206
+ )
207
+
@app.post("/predict_simple", response_model=PredictionResponse)
def predict_simple(request: PredictionRequest):
    """Simple endpoint without topK parameter - same as Gradio version.

    BUG FIX: the original forwarded the request object unchanged, so a
    client-supplied topK was silently honoured even though this endpoint is
    documented as topK-free (the Gradio version called predict(json, None)).
    Strip topK before delegating so the default of 30 applies.
    """
    simple_request = PredictionRequest(
        company_data_json=request.company_data_json,
        topK=None,
    )
    return predict(simple_request)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
212
 
if __name__ == "__main__":
    # Local development entry point; Hugging Face Spaces expects port 7860.
    import uvicorn

    serve_host = "0.0.0.0"
    serve_port = 7860
    uvicorn.run(app, host=serve_host, port=serve_port)
requirements.txt CHANGED
@@ -1,6 +1,9 @@
1
- gradio>=4.0.0
 
 
2
  torch==2.8.0
3
  git+https://github.com/Yura52/rtdl.git@main
4
  pandas
5
  numpy
6
  scipy
 
 
1
+ fastapi==0.104.1
2
+ uvicorn[standard]==0.24.0
3
+ pydantic==2.5.0
4
  torch==2.8.0
5
  git+https://github.com/Yura52/rtdl.git@main
6
  pandas
7
  numpy
8
  scipy
9
+ python-multipart==0.0.6