thangquang09 committed on
Commit
de800a4
·
1 Parent(s): 78f1859

update Dockerfile

Browse files
Files changed (2) hide show
  1. app.py +16 -1
  2. start.sh +28 -7
app.py CHANGED
@@ -12,7 +12,7 @@ class Generate(BaseModel):
12
  duration: float
13
 
14
  chat_history = []
15
- model = Ollama(model="phi2")
16
 
17
  def generate_text(model: Ollama, prompt: str) -> {}:
18
  if prompt == "":
@@ -58,6 +58,21 @@ def generate_text(model: Ollama, prompt: str) -> {}:
58
  async def root():
59
  return {"message": "Hello World"}
60
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
61
  @app.post("/api/generate", summary="Generate text from prompt", tags=["Generate"], response_model=Generate)
62
  def inference(input_prompt: str):
63
  return generate_text(model, input_prompt)
 
12
  duration: float
13
 
14
  chat_history = []
15
+ model = Ollama(model="phi2", base_url="http://localhost:11434")
16
 
17
  def generate_text(model: Ollama, prompt: str) -> {}:
18
  if prompt == "":
 
58
  async def root():
59
  return {"message": "Hello World"}
60
 
61
+ @app.get("/health")
62
+ async def health_check():
63
+ try:
64
+ import requests
65
+ response = requests.get("http://localhost:11434/api/version")
66
+ ollama_status = "OK" if response.status_code == 200 else "Not available"
67
+ except:
68
+ ollama_status = "Error"
69
+
70
+ return {
71
+ "status": "healthy",
72
+ "ollama_status": ollama_status,
73
+ "models_loaded": model is not None
74
+ }
75
+
76
  @app.post("/api/generate", summary="Generate text from prompt", tags=["Generate"], response_model=Generate)
77
  def inference(input_prompt: str):
78
  return generate_text(model, input_prompt)
start.sh CHANGED
@@ -1,17 +1,38 @@
1
  #!/bin/bash
2
 
3
- # Start Ollama in the background with proper home directory
4
  export HOME=/root
5
- ollama serve &
6
 
7
- # Wait for Ollama to start
8
- echo "Waiting for Ollama to start..."
9
- sleep 10
 
 
 
 
 
 
 
 
 
10
 
11
- # Pull models if needed
 
 
 
 
 
 
12
  echo "Running pull_models.sh"
13
  /app/pull_models.sh
14
 
15
- # Start FastAPI app
 
 
 
 
 
 
 
16
  echo "Starting FastAPI application..."
17
  uvicorn app:app --host 0.0.0.0 --port 7860
 
1
  #!/bin/bash
2
 
3
+ # Thiết lập home directory
4
  export HOME=/root
 
5
 
6
+ # Kiểm tra xem Ollama đã chạy chưa
7
+ echo "Checking if Ollama is already running..."
8
+ if pgrep -x "ollama" > /dev/null; then
9
+ echo "Ollama is already running."
10
+ else
11
+ echo "Starting Ollama server..."
12
+ ollama serve &
13
+
14
+ # Đợi Ollama khởi động
15
+ echo "Waiting for Ollama to start..."
16
+ sleep 15
17
+ fi
18
 
19
+ # Kiểm tra lại xem Ollama đã chạy chưa
20
+ if ! pgrep -x "ollama" > /dev/null; then
21
+ echo "ERROR: Failed to start Ollama!"
22
+ exit 1
23
+ fi
24
+
25
+ # Tải mô hình nếu cần
26
  echo "Running pull_models.sh"
27
  /app/pull_models.sh
28
 
29
+ # Kiểm tra kết nối đến Ollama server
30
+ echo "Testing connection to Ollama server..."
31
+ curl -s http://localhost:11434/api/version || {
32
+ echo "ERROR: Cannot connect to Ollama server!"
33
+ exit 1
34
+ }
35
+
36
+ # Bắt đầu ứng dụng FastAPI
37
  echo "Starting FastAPI application..."
38
  uvicorn app:app --host 0.0.0.0 --port 7860