Spaces:

MarcoLeung052
/

nursing-copilot-api

Sleeping

App Files Community

MarcoLeung052 committed on Feb 1

Commit

e4d2a60

verified ·

1 Parent(s): c770c0c

Update api_server.py

Browse files

Files changed (1) hide show

api_server.py +17 -51

api_server.py CHANGED Viewed

@@ -3,25 +3,14 @@
 from fastapi import FastAPI, HTTPException, Depends
 from fastapi.middleware.cors import CORSMiddleware
 from pydantic import BaseModel
-from transformers import GPT2LMHeadModel, GPT2Tokenizer
-import torch
 from backend.agent import run_agent
-# =================================================================
-# 1. 應用程式初始化與模型載入
-# =================================================================
-app = FastAPI(title="GPT-2 Nursing Completion API")
-# 設置 CORS：允許前端頁面 (localhost 或您的服務器 IP) 訪問
-# ⚠️ 注意：在生產環境中，請將 "http://localhost:5500" 替換為您的前端域名！
 origins = [
-    #"http://localhost:5500",  # 假設您使用 VS Code Live Server 或類似工具
-    #"http://127.0.0.1:5500",
-    # 這是您的 GitHub Pages 域名（標準格式）
-    "https://marcoleung052.github.io",
-    # 這是您的 GitHub Pages 子專案路徑 (如果使用子路徑)
     "https://marcoleung052.github.io/NursingRecordCompletion_test",
-    "*" # 為了測試方便，暫時允許所有來源
 ]
 app.add_middleware(
@@ -32,64 +21,41 @@ app.add_middleware(
     allow_headers=["*"],
 )
-# 全局變數用於存儲模型和分詞器
-tokenizer = None
-model = None
-MODEL_PATH = "gpt2" # 這裡可以替換為您微調後的模型資料夾路徑
-@app.on_event("startup")
-async def load_model():
-    """在應用啟動時載入 GPT-2 模型"""
-    global tokenizer, model
-    try:
-        # 載入分詞器
-        tokenizer = GPT2Tokenizer.from_pretrained(MODEL_PATH)
-        # 載入預訓練模型或您微調的模型權重
-        # 如果您的記憶體允許，可以考慮使用 GPU
-        # device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
-        model = GPT2LMHeadModel.from_pretrained(MODEL_PATH)
-        # model.to(device)
-        model.eval() # 設定為評估模式
-        print(f"✅ GPT-2 模型 {MODEL_PATH} 載入成功！")
-    except Exception as e:
-        print(f"❌ 模型載入失敗，請檢查 MODEL_PATH 或依賴庫是否安裝：{e}")
-# =================================================================
-# 2. API 請求與響應格式
-# =================================================================
 class PredictionRequest(BaseModel):
-    """前端發送的請求體格式"""
     prompt: str
     patient_id: str | None = None
     model: str | None = "gpt2-nursing"
 class PredictionResponse(BaseModel):
-    """後端回傳的響應體格式"""
     completions: list[str]
-# =================================================================
-# 3. 核心 API 端點 (已修改為生成 3 個序列)
-# =================================================================
 @app.post("/api/predict", response_model=PredictionResponse)
 def predict_completion(request: PredictionRequest):
     input_text = request.prompt
-    # 交給 agent 處理（固定 or AI）
     result = run_agent(input_text)
-    # agent 回傳的結果格式統一為 list
     return {"completions": result}
-# 運行伺服器
 if __name__ == "__main__":
     import uvicorn
-    # host 0.0.0.0 允許外部訪問，port 8000 與前端設定一致
     uvicorn.run("api_server:app", host="0.0.0.0", port=8000, reload=True)
 # =================================================================
 # 4. 資料庫設定（SQLite + SQLAlchemy）
 # =================================================================

 from fastapi import FastAPI, HTTPException, Depends
 from fastapi.middleware.cors import CORSMiddleware
 from pydantic import BaseModel
 from backend.agent import run_agent
+app = FastAPI(title="Nursing Copilot API")
 origins = [
+    "https://marcoleung052.github.io",
     "https://marcoleung052.github.io/NursingRecordCompletion_test",
+    "*"
 ]
 app.add_middleware(
     allow_headers=["*"],
 )
+# -----------------------------
+# Request / Response Models
+# -----------------------------
 class PredictionRequest(BaseModel):
     prompt: str
     patient_id: str | None = None
     model: str | None = "gpt2-nursing"
 class PredictionResponse(BaseModel):
     completions: list[str]
+# -----------------------------
+# API Endpoint
+# -----------------------------
 @app.post("/api/predict", response_model=PredictionResponse)
 def predict_completion(request: PredictionRequest):
     input_text = request.prompt
+    # ⭐ 交給 agent（固定 or AI）
     result = run_agent(input_text)
+    # ⭐ agent 統一回傳 list
     return {"completions": result}
+# -----------------------------
+# Run server
+# -----------------------------
 if __name__ == "__main__":
     import uvicorn
     uvicorn.run("api_server:app", host="0.0.0.0", port=8000, reload=True)
 # =================================================================
 # 4. 資料庫設定（SQLite + SQLAlchemy）
 # =================================================================