Spaces:

TeamGenKI
/

LLMServer

Paused

App Files Files Community

AurelioAguirre committed on Nov 6, 2024

Commit

840a4e4

1 Parent(s): 801882a

trying again

Browse files

Files changed (1) hide show

main/main.py +33 -5

main/main.py CHANGED Viewed

@@ -13,7 +13,16 @@ from huggingface_hub.hf_api import HfApi
 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
-app = FastAPI(title="LLM Engine Service")
 # Global variable to store the LLM instance
 llm_instance = None
@@ -37,6 +46,20 @@ class GenerateRequest(BaseModel):
     return_as_token_ids: bool = False
     stream: bool = False
 @app.post("/initialize")
 async def initialize_model(request: InitializeRequest):
     """
@@ -167,12 +190,17 @@ async def health_check():
 def main():
     # Load environment variables or configuration here
     host = os.getenv("LLM_ENGINE_HOST", "0.0.0.0")
-    port = int(os.getenv("LLM_ENGINE_PORT", "8001"))
     # Start the server
-    hf_a = HfApi()
-    space_info = hf_a.space_info("TeamGenKI/LLM-Engine")
-    logger.warning(f"Exposing URL: {space_info}")
     uvicorn.run(
         app,
         host=host,

 logging.basicConfig(level=logging.INFO)
 logger = logging.getLogger(__name__)
+# Initialize FastAPI with root path for Spaces
+app = FastAPI(
+    title="LLM Engine Service",
+    # This is crucial for Hugging Face Spaces
+    root_path="/",
+    # Add OpenAPI configs
+    openapi_url="/api/openapi.json",
+    docs_url="/api/docs",
+    redoc_url="/api/redoc"
+)
 # Global variable to store the LLM instance
 llm_instance = None
     return_as_token_ids: bool = False
     stream: bool = False
+@app.get("/")
+async def root():
+    """Root endpoint to verify service is running"""
+    space_url = "https://teamgenki-llm-engine.hf.space"
+    return {
+        "status": "running",
+        "service": "LLM Engine",
+        "endpoints": {
+            "initialize": f"{space_url}/initialize",
+            "generate": f"{space_url}/generate",
+            "health": f"{space_url}/health"
+        }
+    }
 @app.post("/initialize")
 async def initialize_model(request: InitializeRequest):
     """
 def main():
     # Load environment variables or configuration here
     host = os.getenv("LLM_ENGINE_HOST", "0.0.0.0")
+    port = int(os.getenv("LLM_ENGINE_PORT", "7860"))  # Changed to 7860 for Spaces
+    # Log the service URLs
+    space_url = "https://teamgenki-llm-engine.hf.space"
+    logger.info(f"Service will be available at: {space_url}")
+    logger.info(f"API endpoints:")
+    logger.info(f"  Initialize: {space_url}/initialize")
+    logger.info(f"  Generate: {space_url}/generate")
+    logger.info(f"  Health: {space_url}/health")
     # Start the server
     uvicorn.run(
         app,
         host=host,