Spaces:

saemstunes
/

STA-AI

Running

App Files Files Community

saemstunes committed on Sep 29, 2025

Commit

e99e7d4

verified ·

1 Parent(s): abbebe0

Update app.py

Browse files

Files changed (1) hide show

app.py +31 -15

app.py CHANGED Viewed

@@ -357,6 +357,7 @@ def create_gradio_interface():
 def setup_api_endpoints(demo):
     from fastapi import FastAPI, HTTPException
     from pydantic import BaseModel
     from typing import Optional
@@ -372,8 +373,9 @@ def setup_api_endpoints(demo):
         timestamp: str
         model_used: str
     @demo.app.post("/api/chat")
-    async def api_chat(request: ChatRequest):
         try:
             if not request.message.strip():
                 raise HTTPException(status_code=400, detail="Message cannot be empty")
@@ -386,13 +388,13 @@ def setup_api_endpoints(demo):
             response = ai_system.process_query(request.message, request.user_id, request.conversation_id)
             processing_time = time.time() - start_time
-            return ChatResponse(
-                response=response,
-                processing_time=processing_time,
-                conversation_id=request.conversation_id or f"conv_{int(time.time())}",
-                timestamp=datetime.now().isoformat(),
-                model_used=Config.MODEL_NAME
-            )
         except HTTPException:
             raise
@@ -400,32 +402,46 @@ def setup_api_endpoints(demo):
             logger.error(f"API chat error: {e}")
             raise HTTPException(status_code=500, detail="Internal server error")
     @demo.app.get("/api/health")
-    async def api_health():
-        return get_system_status()
     @demo.app.get("/api/models")
-    async def api_models():
-        return {
             "available_models": ["microsoft/Phi-3.5-mini-instruct"],
             "current_model": Config.MODEL_NAME,
             "quantization": "Q4_K_M",
             "context_length": 4096,
             "parameters": "3.8B"
         }
     @demo.app.get("/api/stats")
-    async def api_stats():
         if not monitor:
-            return {"error": "Monitoring system not available"}
-        return {
             "total_requests": len(monitor.inference_metrics),
             "average_response_time": monitor.get_average_response_time(),
             "error_rate": monitor.get_error_rate(),
             "uptime": monitor.get_uptime(),
             "system_health": get_system_status()
         }
 if __name__ == "__main__":
     logger.info("🎵 Starting Saem's Tunes AI on Hugging Face Spaces...")

 def setup_api_endpoints(demo):
     from fastapi import FastAPI, HTTPException
+    from fastapi.responses import JSONResponse
     from pydantic import BaseModel
     from typing import Optional
         timestamp: str
         model_used: str
+    # NOTE: the endpoints below are intentionally plain `def` (not `async def`); none of them awaits anything.
     @demo.app.post("/api/chat")
+    def api_chat(request: ChatRequest):  # Remove async
         try:
             if not request.message.strip():
                 raise HTTPException(status_code=400, detail="Message cannot be empty")
             response = ai_system.process_query(request.message, request.user_id, request.conversation_id)
             processing_time = time.time() - start_time
+            return JSONResponse(content={
+                "response": response,
+                "processing_time": processing_time,
+                "conversation_id": request.conversation_id or f"conv_{int(time.time())}",
+                "timestamp": datetime.now().isoformat(),
+                "model_used": Config.MODEL_NAME
+            })
         except HTTPException:
             raise
             logger.error(f"API chat error: {e}")
             raise HTTPException(status_code=500, detail="Internal server error")
+    # NOTE: plain `def` handler; it returns the status dict directly and lets FastAPI serialize it to JSON.
     @demo.app.get("/api/health")
+    def api_health():  # Remove async
+        try:
+            status_data = get_system_status()
+            return status_data  # FastAPI automatically converts dict to JSON
+        except Exception as e:
+            logger.error(f"Health endpoint error: {e}")
+            return JSONResponse(
+                content={"status": "error", "error": str(e)},
+                status_code=500
+            )
     @demo.app.get("/api/models")
+    def api_models():  # Remove async
+        models_info = {
             "available_models": ["microsoft/Phi-3.5-mini-instruct"],
             "current_model": Config.MODEL_NAME,
             "quantization": "Q4_K_M",
             "context_length": 4096,
             "parameters": "3.8B"
         }
+        return models_info  # FastAPI automatically converts dict to JSON
     @demo.app.get("/api/stats")
+    def api_stats():  # Remove async
         if not monitor:
+            return JSONResponse(
+                content={"error": "Monitoring system not available"},
+                status_code=503
+            )
+        stats_data = {
             "total_requests": len(monitor.inference_metrics),
             "average_response_time": monitor.get_average_response_time(),
             "error_rate": monitor.get_error_rate(),
             "uptime": monitor.get_uptime(),
             "system_health": get_system_status()
         }
+        return stats_data  # FastAPI automatically converts dict to JSON
 if __name__ == "__main__":
     logger.info("🎵 Starting Saem's Tunes AI on Hugging Face Spaces...")