Spaces:

TeamGenKI
/

Inference-API

Runtime error

App Files Files Community

AurelioAguirre committed on Jan 10, 2025

Commit

baae755

1 Parent(s): c6b21e3

changed to uvicorn setup for HF v2

Browse files

Files changed (1) hide show

main/main.py +34 -58

main/main.py CHANGED Viewed

@@ -6,7 +6,6 @@ import yaml
 import logging
 import asyncio
 from pathlib import Path
-from fastapi import FastAPI
 from fastapi.middleware.cors import CORSMiddleware
 from .routes import router, init_router
 from .api import InferenceApi
@@ -25,68 +24,45 @@ def load_config():
     with open(config_path) as f:
         return yaml.safe_load(f)
-async def init_app() -> tuple[FastAPI, InferenceApi, dict]:
-    """Initialize and configure the FastAPI application."""
-    logger = setup_logging()
-    try:
-        # Load configuration
-        config = load_config()
-        server_config = config.get('server', {})
-        # Initialize API with config
-        api = InferenceApi(config)
-        # Initialize router with the API instance
-        await init_router(api)
-        # Create LitServer instance with config
-        server = ls.LitServer(
-            api,
-            timeout=server_config.get('timeout', 60),
-            max_batch_size=server_config.get('max_batch_size', 1),
-            track_requests=True
-        )
-        # Get the FastAPI app from the LitServer
-        app = server.app
-        # Add CORS middleware
-        app.add_middleware(
-            CORSMiddleware,
-            allow_origins=["*"],
-            allow_credentials=True,
-            allow_methods=["*"],
-            allow_headers=["*"],
-        )
-        # Add routes with configured prefix
-        api_prefix = config.get('llm_server', {}).get('api_prefix', '/api/v1')
-        app.include_router(router, prefix=api_prefix)
-        return app, api, config
-    except Exception as e:
-        logger.error(f"Application initialization failed: {str(e)}")
-        raise
-# Create the FastAPI app instance for uvicorn
-app, api_instance, config_dict = asyncio.get_event_loop().run_until_complete(init_app())
 async def run_server():
     """Run the server directly (not through uvicorn)"""
-    server_config = config_dict.get('server', {})
     port = server_config.get('port', 8001)
     host = server_config.get('host', '0.0.0.0')
-    # Create LitServer instance with all required parameters
-    server = ls.LitServer(
-        api_instance,
-        timeout=server_config.get('timeout', 60),
-        max_batch_size=server_config.get('max_batch_size', 1),
-        track_requests=True
-    )
     server.run(host=host, port=port)
 def main():

 import logging
 import asyncio
 from pathlib import Path
 from fastapi.middleware.cors import CORSMiddleware
 from .routes import router, init_router
 from .api import InferenceApi
     with open(config_path) as f:
         return yaml.safe_load(f)
+# Initialize everything synchronously
+logger = setup_logging()
+config = load_config()
+server_config = config.get('server', {})
+api = InferenceApi(config)
+# Create LitServer instance
+server = ls.LitServer(
+    api,
+    timeout=server_config.get('timeout', 60),
+    max_batch_size=server_config.get('max_batch_size', 1),
+    track_requests=True
+)
+# Get the FastAPI app from LitServer
+app = server.app
+# Add CORS middleware
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_credentials=True,
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+# Add routes with configured prefix
+api_prefix = config.get('llm_server', {}).get('api_prefix', '/api/v1')
+app.include_router(router, prefix=api_prefix)
+@app.on_event("startup")
+async def startup_event():
+    """Initialize async components on startup."""
+    await init_router(api)
 async def run_server():
     """Run the server directly (not through uvicorn).

     Reads ``port`` and ``host`` from the module-level ``server_config``
     mapping, falling back to 8001 and '0.0.0.0' when the keys are absent,
     and passes them to ``server.run``.
     """
     port = server_config.get('port', 8001)
     host = server_config.get('host', '0.0.0.0')
     # NOTE(review): this coroutine contains no ``await``; ``server.run`` is
     # presumably a blocking call -- confirm how the caller invokes it.
     server.run(host=host, port=port)
 def main():